Skip to content

Instantly share code, notes, and snippets.

@fabiobatalha
fabiobatalha / delayed.py
Last active August 29, 2015 14:04
Check delayed content
#!/usr/bin/python2.7
# coding: utf-8
import unittest
import datetime
def is_delayed(ratio, periodicity, last_publication_date):
"""
ratio (integer): numero de fasciculos para considerar o atraso.
periodicity (integer): periodicidade do periodico em meses 1, 2, 3, 4, 5.....
import json
import urllib, urllib2
import urlparse
from unidecode import unidecode
CROSSREF_API_DOI = 'http://search.crossref.org/dois?'
def verify_doi(doi,article):
doi_query_url = 'http://search.crossref.org/dois?' + urllib.urlencode({'q': doi})
response = json.loads(urllib2.urlopen(doi_query_url).read())
@fabiobatalha
fabiobatalha / books.py
Last active August 29, 2015 13:56
Tabula livros armazenados no CouchDB
# coding: utf-8
import json
import urllib2
books = json.loads(urllib2.urlopen('http:/127.0.0.1:5984/scielobooks_1a/_design/scielobooks/_view/books').read())
for row in books['rows']:
print u'|'.join(
[
@fabiobatalha
fabiobatalha / finddoi.py
Last active December 20, 2015 06:49
API to query Crossref for DOIs matching the given metadata.
# encoding: utf-8
import urllib2
from xml.etree import ElementTree
from xml.etree.ElementTree import Element
from urllib import urlencode
class FindDoi(object):
def __init__(self, format='unixref'):
@fabiobatalha
fabiobatalha / get_stats_books.py
Created June 26, 2013 20:11
Script para coletar dados de acessos registrados no MongoDB e tabular por mês e ano.
#!/usr/bin/env python
import os
import urllib2
import json
import argparse
import pymongo
def get_books(api_host='localhost', api_port='5984'):
@fabiobatalha
fabiobatalha / load_remarks.py
Last active December 18, 2015 00:59
load_remarks.py
import os
import re
from lxml import etree
ns = {'xs': 'http://www.w3.org/2001/XMLSchema',
'mml': 'http://www.w3.org/1998/Math/MathML',
'xsi': 'http://www.w3.org/2001/XMLSchema-instance',
'xlink': 'http://www.w3.org/1999/xlink'}
@fabiobatalha
fabiobatalha / memento.py
Last active January 20, 2023 09:29
Memento Design Pattern sample in Python
#!/usr/bin/python
import copy
class Originator(object):
class Memento(object):
def __init__(self, mstate):
self.mstate = mstate
@fabiobatalha
fabiobatalha / html_colector.py
Last active December 16, 2015 04:09
Script para carregar o texto completo de press releases em arquivos HTML
#!/usr/bin/env python
# coding: utf-8
import os
import shutil
import argparse
import json
def dict_articles_press_releases(cisis_path, scielo_path):
query = os.popen('''{0}/mx {1}/bases/artigo/artigo btell=0 lw=0 AHPR=$ pft="v880,'|',v881,'|',v241^i/" -all now'''.format(cisis_path, scielo_path))