nicholasKluge committed on
Commit
173b43f
·
1 Parent(s): 58c56e0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -8,10 +8,11 @@ from sklearn.feature_extraction.text import TfidfVectorizer
8
  from transformers import AutoTokenizer, AutoModelForCausalLM, AutoModelForSequenceClassification
9
 
10
  # download the instruct-aira-dataset
11
- dataset = load_dataset("nicholasKluge/instruct-aira-dataset", split='portuguese')
 
12
 
13
  # convert the dataset to a pandas dataframe
14
- df = dataset.to_pandas()
15
 
16
  # rename the columns
17
  df.columns = ['Prompt', 'Completion']
 
8
  from transformers import AutoTokenizer, AutoModelForCausalLM, AutoModelForSequenceClassification
9
 
10
  # download the instruct-aira-dataset
11
+ #dataset = load_dataset("nicholasKluge/instruct-aira-dataset", split='portuguese')
12
+ dataset = load_dataset("parquet", data_files="instruct-aira-dataset.parquet")
13
 
14
  # convert the dataset to a pandas dataframe
15
+ df = dataset['train'].to_pandas()
16
 
17
  # rename the columns
18
  df.columns = ['Prompt', 'Completion']