dayannex committed on
Commit
389be27
·
1 Parent(s): 8ca847a

app modified dataset reorden token

Browse files
Files changed (1) hide show
  1. app.py +18 -1
app.py CHANGED
@@ -364,7 +364,24 @@ class ModeloDataset:
364
  i=i+1
365
  labels = predicted_token_class_ids
366
  loss = self.model(input_ids, labels=labels).loss
367
- return ids,_predicted_tokens_classes
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
368
  else:
369
 
370
  print('idioma:',idioma)
 
364
  i=i+1
365
  labels = predicted_token_class_ids
366
  loss = self.model(input_ids, labels=labels).loss
367
+
368
+ new_tokens=[]
369
+ ig_tok=[]
370
+ i=0
371
+ new_identificadores=[]
372
+ for item in tokenized_text:
373
+
374
+ aux1, aux2= self.reordenacion_tokens(item,"_")
375
+ new_tokens.append(aux1)
376
+ ig_tok.append(aux2)
377
+
378
+
379
+ for items in _predicted_tokens_classes:
380
+ aux=self.reordenacion_identificadores(ig_tok[i],items,len(new_tokens[i]))
381
+ new_identificadores.append(aux)
382
+ i=i+1
383
+
384
+ return new_identificadores, new_tokens#ids,_predicted_tokens_classes
385
  else:
386
 
387
  print('idioma:',idioma)