Skip to content

Instantly share code, notes, and snippets.

@paulodiogo
Last active June 11, 2020 19:49
Show Gist options
  • Save paulodiogo/879992e81e3e001055b9136231c1a04c to your computer and use it in GitHub Desktop.
Save paulodiogo/879992e81e3e001055b9136231c1a04c to your computer and use it in GitHub Desktop.
NAI
import pandas as pd
import math
INPUT_PATH = "tabela3218.xlsx"
OUTPUT_PATH = "output.xlsx"


def strided_row_values(frame, row_position, start=3, step=8):
    """Return every ``step``-th cell of one row, starting at column ``start``.

    Both the row and its cells are addressed by position (``.iloc``), so the
    result does not depend on how the spreadsheet's header row was labelled.

    Args:
        frame: DataFrame holding the sheet.
        row_position: Zero-based position of the row to read.
        start: Zero-based position of the first cell to take.
        step: Distance between consecutive cells.

    Returns:
        A list with the selected cells; empty when the sheet has no row at
        ``row_position``.
    """
    if not 0 <= row_position < len(frame):
        return []
    return frame.iloc[row_position].iloc[start::step].tolist()


def build_table(frame):
    """Build the two-column output table from rows 3 and 5 of ``frame``.

    Returns:
        A DataFrame with columns ``COLUNA1`` (cells of row 3) and ``COLUNA2``
        (cells of row 5), each taken every 8 columns starting at column 3.
    """
    columns = {
        'COLUNA1': strided_row_values(frame, 3),
        'COLUNA2': strided_row_values(frame, 5),
    }
    # Series (unlike plain lists) may differ in length: pandas pads the
    # shorter one with NaN instead of raising when one of the rows is absent.
    return pd.DataFrame(
        {label: pd.Series(values) for label, values in columns.items()},
        columns=['COLUNA1', 'COLUNA2'],
    )


def main():
    """Read the input workbook and write the extracted table to disk."""
    sheet = pd.read_excel(INPUT_PATH)
    build_table(sheet).to_excel(OUTPUT_PATH, index=False)


if __name__ == "__main__":
    main()
import pandas as pd
import math
INPUT_PATH = "tabela3218.xlsx"
OUTPUT_PATH = "output.xlsx"
FIRST_DATA_ROW = 5
COLUNAS_SELECIONADAS = [3, 11]
LABEL_COLUNAS = ['A', 'B']


def select_columns(frame, positions, labels, first_row=FIRST_DATA_ROW):
    """Copy the chosen columns of ``frame`` into a new, relabelled table.

    Rows before ``first_row`` are skipped. Within each chosen column the
    missing cells are dropped and the remaining values are packed upwards,
    independently of the other columns.

    Args:
        frame: DataFrame holding the sheet.
        positions: Zero-based positions of the columns to copy.
        labels: Output column names, one per entry of ``positions``.
        first_row: Zero-based position of the first row to read.

    Returns:
        A DataFrame with one column per label. Columns that end up shorter
        than the longest one are padded with NaN at the bottom.

    Raises:
        ValueError: If ``positions`` and ``labels`` differ in length.
    """
    if len(positions) != len(labels):
        raise ValueError(
            f"expected one label per column, got {len(positions)} column(s) "
            f"and {len(labels)} label(s)"
        )
    body = frame.iloc[first_row:]
    # dropna() copes with text cells as well as numbers; resetting the index
    # makes every column start at row 0 so pandas can align and pad them.
    data = {
        label: body.iloc[:, position].dropna().reset_index(drop=True)
        for position, label in zip(positions, labels)
    }
    return pd.DataFrame(data, columns=list(labels))


def main():
    """Read the input workbook and write the selected columns to disk."""
    sheet = pd.read_excel(INPUT_PATH)
    result = select_columns(sheet, COLUNAS_SELECIONADAS, LABEL_COLUNAS)
    result.to_excel(OUTPUT_PATH, index=False)


if __name__ == "__main__":
    main()
import math
import sys

import pandas as pd
OUTPUT_PATH = "output.xlsx"
HEADER_ROWS = 5
USAGE = (
    "usage: python extractor-param.py <workbook.xlsx> "
    "<col,col,...> <label,label,...>"
)


def parse_cli(argv):
    """Turn the raw command line into ``(path, positions, labels)``.

    Args:
        argv: Full argument vector, program name included (``sys.argv``).

    Returns:
        A tuple with the workbook path, the list of zero-based column
        positions and the list of output labels.

    Raises:
        SystemExit: With a usage message when arguments are missing, a
            column position is not an integer, or the number of positions
            and labels differ.
    """
    if len(argv) < 4:
        raise SystemExit(USAGE)
    path = str(argv[1])
    try:
        positions = [int(token) for token in argv[2].split(',')]
    except ValueError:
        raise SystemExit(
            f"column positions must be integers: {argv[2]!r}\n{USAGE}"
        ) from None
    labels = argv[3].split(',')
    if len(positions) != len(labels):
        raise SystemExit(
            f"got {len(positions)} column(s) but {len(labels)} label(s)\n{USAGE}"
        )
    return path, positions, labels


def extract_columns(frame, positions, labels, header_rows=HEADER_ROWS):
    """Copy the chosen columns of ``frame`` into a new, relabelled table.

    The first ``header_rows`` rows are skipped. Missing cells are dropped
    from each column independently and the remaining values packed upwards.

    Args:
        frame: DataFrame holding the sheet.
        positions: Zero-based positions of the columns to copy.
        labels: Output column names, one per entry of ``positions``.
        header_rows: Number of leading rows to ignore.

    Returns:
        A DataFrame with one column per label; shorter columns are padded
        with NaN at the bottom.
    """
    body = frame.iloc[header_rows:]
    # dropna() copes with text cells as well as numbers; resetting the index
    # makes every column start at row 0 so pandas can align and pad them.
    data = {
        label: body.iloc[:, position].dropna().reset_index(drop=True)
        for position, label in zip(positions, labels)
    }
    return pd.DataFrame(data, columns=list(labels))


def main():
    """Extract the columns requested on the command line into output.xlsx."""
    path, positions, labels = parse_cli(sys.argv)
    sheet = pd.read_excel(path)
    extract_columns(sheet, positions, labels).to_excel(OUTPUT_PATH, index=False)


if __name__ == "__main__":
    main()
import pandas as pd
import math
INPUT_PATH = "tabela3218.xlsx"
OUTPUT_PATH = "output.xlsx"


def non_missing_cells(frame, column_position, first_row=5):
    """Return the non-missing cells of one column, from ``first_row`` down.

    Args:
        frame: DataFrame holding the sheet.
        column_position: Zero-based position of the column to read.
        first_row: Zero-based position of the first row to read.

    Returns:
        A list with the column's values in sheet order, missing cells
        (NaN/None) removed. Text cells are kept as they are.
    """
    return frame.iloc[first_row:, column_position].dropna().tolist()


def build_output(frame):
    """Build the ``COLUNA1``/``COLUNA2`` table from columns 3 and 11.

    Returns:
        A DataFrame whose ``COLUNA1`` holds the non-missing cells of column 3
        and ``COLUNA2`` those of column 11, both read from row 5 onwards.
    """
    extracted = {
        'COLUNA1': non_missing_cells(frame, 3),
        'COLUNA2': non_missing_cells(frame, 11),
    }
    # The two columns can lose a different number of cells; Series let
    # pandas pad the shorter one with NaN instead of raising ValueError.
    return pd.DataFrame(
        {label: pd.Series(values) for label, values in extracted.items()},
        columns=['COLUNA1', 'COLUNA2'],
    )


def main():
    """Read the input workbook and write the extracted table to disk."""
    sheet = pd.read_excel(INPUT_PATH)
    build_output(sheet).to_excel(OUTPUT_PATH, index=False)


if __name__ == "__main__":
    main()

Antes de rodar

  • pip install pandas
  • pip install openpyxl
  • pip install xlrd

Rodar

  • python extractor.py
  • python extractor-final-form.py

Para o extractor-param.py, você deve passar o caminho do arquivo, os índices (começando em zero) das colunas de que precisa e os nomes que quer dar a elas, com índices e nomes separados por vírgula:

  • python extractor-param.py tabela3218.xlsx 3,11 A,B
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment