-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdvc
44 lines (33 loc) · 1 KB
/
dvc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
# Workflow notes for dvc.
# Install dvc and its s3 extra through pip or a package manager, then
# authorize with the s3 storage using the appropriate config files.
# The requirement is quoted so the shell does not treat "[s3]" as a glob
# character class (zsh aborts with "no matches found" when it is unquoted).
pip install dvc 'dvc[s3]'
# Needed for the dvc-data command.
pip install 'dvc-data[cli]'
# Sometimes boto has to be installed additionally.
pip install boto
# Alternative: install using conda.
conda install -c conda-forge dvc
# It might be better to install using pip, since the dvc-data[cli] extra
# used above can only be installed using pip.
# Step 1: initialize DVC.
dvc init
# Step 2: DVC stages some files itself, so you only need to commit them.
git commit -m "Initialize DVC"
# Step 3: add data, then commit the generated .dvc file and .gitignore.
dvc add path/to/data
git add path/to/data.dvc path/to/.gitignore
git commit -m "added data to storage"
git push
# Step 4 (optional): if you use remote storage, push the data to it.
dvc push
# See the status.
dvc status
# Check out the version of the data from the last commit.
dvc checkout
# Check out a specific file.
dvc checkout -- /path/to/file
# List the files tracked by DVC in the current directory.
# "dvc list" takes the repository location first ("." here); a path inside
# the repository may follow it. An unquoted <path> placeholder must not be
# pasted as-is: the shell parses "<" and ">" as redirections.
dvc list --dvc-only .
# Compute the hash for a directory.
dvc-data build /path/to/dir