diff --git a/hft.py b/hft.py index 7f4292f..62c63e6 100644 --- a/hft.py +++ b/hft.py @@ -207,7 +207,7 @@ def main(): print("\nBrak danych do treningu!") return - dataset = Dataset.from_list(data) + dataset = Dataset.from_dict({k: [dic[k] for dic in data] for k in data[0]}) def tokenize_function(examples): tokenized = tokenizer(