Skip to content

Instantly share code, notes, and snippets.

@Soumi7
Created June 23, 2020 12:20
Show Gist options
  • Save Soumi7/0fb9c5f9dad0d6bd43f652d395517693 to your computer and use it in GitHub Desktop.
Save Soumi7/0fb9c5f9dad0d6bd43f652d395517693 to your computer and use it in GitHub Desktop.
Parser
import pandas as pd
# Load the dataset; 'Text' holds one sentence per row.
df = pd.read_csv("drive/My Drive/Data.csv")
Sentences = df['Text']

# Columns 'Unnamed: 1' .. 'Unnamed: 11' are merged into a single
# space-separated string per row (presumably one label per word -- confirm
# against the CSV). astype(str) turns missing cells into the text "nan".
label_columns = ["Unnamed: %d" % k for k in range(1, 12)]
joined_labels = df[label_columns[0]].astype(str)
for column in label_columns[1:]:
    joined_labels = joined_labels + " " + df[column].astype(str)
df['Labels'] = joined_labels

# The individual columns are no longer needed once merged.
df = df.drop(columns=label_columns)
Labels = df['Labels']
# Build one [sentence_id, word, label] row per word for the first 95
# sentences (fewer if the data has fewer rows).
traindata = []
train_count = len(Sentences[:95])
for sentence_id in range(train_count):
    words = Sentences[sentence_id].split(" ")
    labels = Labels[sentence_id].split(" ")
    # At most the first 95 words of a sentence are used; labels are matched
    # to words by position, so a sentence with more words than labels
    # raises IndexError here.
    for position, word in enumerate(words[:95]):
        traindata.append([sentence_id, word, labels[position]])
# Build one [sentence_id, word, label] row per word for rows 95..104.
# Sentence ids are rebased so the first of these rows gets id 0.
testdata = []
for sentence_id, row in enumerate(range(95, 105)):
    words = Sentences[row].split(" ")
    labels = Labels[row].split(" ")
    # Labels are matched to words by position; a sentence with more words
    # than labels raises IndexError here.
    for position, word in enumerate(words):
        testdata.append([sentence_id, word, labels[position]])
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment