Gang Li leebird

## python2_unicode_string.py
# -*- coding: utf-8 -*-
# Test various characteristics of Unicode strings in Python 2.
# In Python 2, there are two types for storing string data: str and unicode.
# The type str is a byte string, while the type unicode stores Unicode
# code points, each of which is represented by one or more bytes.

# Define a simple ASCII string, the type is str.
ascii_a = 'abcdefg'
print 'OUTPUT 1'
print type(ascii_a)

## split_sent.py
''' Initialization: install NLTK python module and download data.
$ pip install nltk
$ echo 'import nltk; nltk.download("punkt")' | python
'''

from __future__ import print_function, unicode_literals
import nltk.data

_sent_detector = nltk.data.load('tokenizers/punkt/english.pickle')

## mirna_ner_api.py
from __future__ import print_function, unicode_literals
import json
import urllib
import urllib2

# The API URL.
api_url = 'http://research.bioinformatics.udel.edu/miRTex/ner'

# The documents to be processed.
documents = {

## tag_and_score.py
# Note that this is not a standalone script. It has dependencies.
# Here it is just used as an example illustrating the scoring
# process for miRTex results.

from __future__ import unicode_literals, print_function
import pickle
import os
import codecs
import sys
import re

## converter.py
from __future__ import unicode_literals
import sys
import codecs
import json
from lxml import etree

# See http://lxml.de/api.html#incremental-xml-generation
# for incremental XML generation used below.


## document_pb2.py
# Generated by the protocol buffer compiler.  DO NOT EDIT!
# source: document.proto

import sys
_b=sys.version_info[0]<3 and (lambda x:x) or (lambda x:x.encode('latin1'))
from google.protobuf import descriptor as _descriptor
from google.protobuf import message as _message
from google.protobuf import reflection as _reflection
from google.protobuf import symbol_database as _symbol_database
from google.protobuf import descriptor_pb2
	# -*- coding: utf-8 -*-
	# Test various characteristics of Unicode strings in Python 2.
	# In Python 2, there are two types for storing string data: str and unicode.
	# The type str is a byte string, while the type unicode stores Unicode
	# code points, each of which is represented by one or more bytes.

	# Define a simple ASCII string, the type is str.
	ascii_a = 'abcdefg'
	print 'OUTPUT 1'
	print type(ascii_a)
	''' Initialization: install NLTK python module and download data.
	$ pip install nltk
	$ echo 'import nltk; nltk.download("punkt")' | python
	'''

	from __future__ import print_function, unicode_literals
	import nltk.data

	_sent_detector = nltk.data.load('tokenizers/punkt/english.pickle')
	from __future__ import print_function, unicode_literals
	import json
	import urllib
	import urllib2

	# The API URL.
	api_url = 'http://research.bioinformatics.udel.edu/miRTex/ner'

	# The documents to be processed.
	documents = {
	# Note that this is not a standalone script. It has dependencies.
	# Here it is just used as an example illustrating the scoring
	# process for miRTex results.

	from __future__ import unicode_literals, print_function
	import pickle
	import os
	import codecs
	import sys
	import re
	from __future__ import unicode_literals
	import sys
	import codecs
	import json
	from lxml import etree

	# See http://lxml.de/api.html#incremental-xml-generation
	# for incremental XML generation used below.
	# Generated by the protocol buffer compiler. DO NOT EDIT!
	# source: document.proto

	import sys
	_b=sys.version_info[0]<3 and (lambda x:x) or (lambda x:x.encode('latin1'))
	from google.protobuf import descriptor as _descriptor
	from google.protobuf import message as _message
	from google.protobuf import reflection as _reflection
	from google.protobuf import symbol_database as _symbol_database
	from google.protobuf import descriptor_pb2