lucabadiali committed on
Commit
996d41a
·
1 Parent(s): 48aba2c
.gitignore CHANGED
@@ -6,4 +6,5 @@ data/dataset
6
  app/__pycache__
7
  src/app/__pycache__/__init__.cpython-311.pyc
8
  src/app/__pycache__/app.cpython-311.pyc
9
- src/app/__pycache__/utils.cpython-311.pyc
 
 
6
  app/__pycache__
7
  src/app/__pycache__/__init__.cpython-311.pyc
8
  src/app/__pycache__/app.cpython-311.pyc
9
+ src/app/__pycache__/utils.cpython-311.pyc
10
+ src/app/__pycache__/config.cpython-311.pyc
src/app/__pycache__/config.cpython-311.pyc ADDED
Binary file (1.67 kB). View file
 
src/train_model.py CHANGED
@@ -8,7 +8,9 @@ from transformers import (
8
  TrainingArguments, Trainer, EarlyStoppingCallback,
9
  DataCollatorWithPadding
10
  )
11
- from datasets import load_from_disk
 
 
12
 
13
 
14
  # --- Device detection ---
@@ -74,8 +76,12 @@ model.config.use_cache = False
74
  #### DATASET LOADING
75
 
76
 
77
- dataset_path = "data/dataset" # same path you used before
78
- dataset = load_from_disk(dataset_path)
 
 
 
 
79
 
80
 
81
  # ---- COPY-PASTE FROM HERE ----
 
8
  TrainingArguments, Trainer, EarlyStoppingCallback,
9
  DataCollatorWithPadding
10
  )
11
+ from datasets import load_dataset,load_from_disk
12
+ from pathlib import Path
13
+
14
 
15
 
16
  # --- Device detection ---
 
76
  #### DATASET LOADING
77
 
78
 
79
+ dataset_path = Path("data/dataset")
80
+ if dataset_path.exists():
81
+ dataset = load_from_disk(dataset_path)
82
+ else:
83
+ dataset = load_dataset('tweet_eval', 'sentiment')
84
+
85
 
86
 
87
  # ---- COPY-PASTE FROM HERE ----