Skip to content

Commit

Permalink
First commit with setup and DVC files
Browse files Browse the repository at this point in the history
  • Loading branch information
Ubuntu committed May 3, 2024
1 parent 5aad06f commit d4f6285
Show file tree
Hide file tree
Showing 7 changed files with 24 additions and 5 deletions.
3 changes: 3 additions & 0 deletions .dvc/.gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
/config.local
/tmp
/cache
6 changes: 6 additions & 0 deletions .dvc/config
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
[core]
remote = remote_storage
['remote "remote_storage"']
url = ../../dvc_remote
['remote "remote_gdrive"']
url = gdrive://1IDOqFaErwMk0BnK2_W2bYrodEE-mCVnN
3 changes: 3 additions & 0 deletions .dvcignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
# Add patterns of files dvc should ignore, which could improve
# the performance. Learn more at
# https://dvc.org/doc/user-guide/dvcignore
2 changes: 1 addition & 1 deletion .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -79,7 +79,7 @@ target/
.ipynb_checkpoints/

# exclude data from source control by default
-/data/
+#/data/

# Mac OS-specific storage files
.DS_Store
Expand Down
1 change: 1 addition & 0 deletions data/.gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
/raw
6 changes: 6 additions & 0 deletions data/raw.dvc
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
outs:
- md5: 90c3e04bb8fa1558eb70f9096b5b6010.dir
size: 31082914
nfiles: 4
hash: md5
path: raw
8 changes: 4 additions & 4 deletions src/data/make_dataset.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,10 +21,10 @@ def main(input_filepath, output_filepath):

# Prompt the user for input file paths
input_filepath= click.prompt('Enter the file path for the input data', type=click.Path(exists=True))
-input_filepath_users = f"{input_filepath}\\usagers-2021.csv"
-input_filepath_caract = f"{input_filepath}\\caracteristiques-2021.csv"
-input_filepath_places = f"{input_filepath}\\lieux-2021.csv"
-input_filepath_veh = f"{input_filepath}\\vehicules-2021.csv"
+input_filepath_users = f"{input_filepath}/usagers-2021.csv"
+input_filepath_caract = f"{input_filepath}/caracteristiques-2021.csv"
+input_filepath_places = f"{input_filepath}/lieux-2021.csv"
+input_filepath_veh = f"{input_filepath}/vehicules-2021.csv"
output_filepath = click.prompt('Enter the file path for the output preprocessed data (e.g., output/preprocessed_data.csv)', type=click.Path())

# Call the main data processing function with the provided file paths
Expand Down

0 comments on commit d4f6285

Please sign in to comment.