Last active
December 15, 2017 05:51
-
-
Save hhachiya/63181abf5dfddef301897bfe6028263d to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# -*- coding: utf-8 -*- | |
import os | |
import pandas as pd | |
import numpy as np | |
#-------------------
# Start of class definition
class sentence:
    """Tab-separated sentence data set with keyword search.

    The file is loaded into a pandas DataFrame stored in ``self.data``;
    ``search`` reads that frame's ``'sentence'`` column.
    """

    # Name of the folder that holds the data files
    dataPath = 'sentiment_labelled_sentences'

    #------------------------------------
    # Load the tab-separated file
    def __init__(self, fname):
        """Read ``fname`` (joined onto ``dataPath``) into ``self.data``.

        Args:
            fname: File path (string), joined onto ``dataPath`` with
                ``os.path.join``.
        """
        # Build the path of the data file
        fullpath = os.path.join(self.dataPath, fname)

        # The separator must be passed by keyword: pandas 2.0 made every
        # read_csv argument after the path keyword-only, so the positional
        # form raises TypeError there.
        self.data = pd.read_csv(fullpath, sep='\t')
    #------------------------------------

    #------------------------------------
    # String search
    def search(self, keyword, *, regex=True):
        """Return the sentences that contain ``keyword``.

        Args:
            keyword: Search keyword (string). It is interpreted as a regular
                expression unless ``regex`` is False.
            regex: Pass False to match ``keyword`` literally, e.g. when it
                contains characters such as ``(`` or ``?``.

        Returns:
            A NumPy array holding the matching entries of the ``'sentence'``
            column.
        """
        column = self.data['sentence']

        # na=False makes missing sentences count as "no match"; without it the
        # mask contains NaN and cannot be used for boolean indexing.
        mask = column.str.contains(keyword, regex=regex, na=False)

        # Return the hits as an np.array
        return column[mask].values
#------------------------------------
# End of class definition
#-------------------
#-------------------
# Start of main
if __name__ == "__main__":
    # Build the data set from the file amazon_cells_labelled.txt
    dataset = sentence("amazon_cells_labelled.txt")

    # Collect every sentence that contains the phrase
    hits = dataset.search("very good")

    # Print each hit together with its position in the result array
    for position, text in enumerate(hits):
        print(position, ":", text)
# End of main
#-------------------
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment