Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

process_files.py 2.7 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
  1. import os, shutil
  2. import conf
  3. # The path to the directory where the original
  4. # dataset was uncompressed
  5. original_dataset_dir = os.path.join(conf.data_dir, 'train')
  6. # The directory where we will
  7. # store our smaller dataset
  8. os.mkdir(conf.base_dir)
  9. # Directories for our training,
  10. # validation and test splits
  11. os.mkdir(conf.train_dir)
  12. os.mkdir(conf.validation_dir)
  13. os.mkdir(conf.test_dir)
  14. # Directory with our training cat pictures
  15. train_cats_dir = os.path.join(conf.train_dir, 'cats')
  16. os.mkdir(train_cats_dir)
  17. # Directory with our training dog pictures
  18. train_dogs_dir = os.path.join(conf.train_dir, 'dogs')
  19. os.mkdir(train_dogs_dir)
  20. # Directory with our validation cat pictures
  21. validation_cats_dir = os.path.join(conf.validation_dir, 'cats')
  22. os.mkdir(validation_cats_dir)
  23. # Directory with our validation dog pictures
  24. validation_dogs_dir = os.path.join(conf.validation_dir, 'dogs')
  25. os.mkdir(validation_dogs_dir)
  26. # Directory with our validation cat pictures
  27. test_cats_dir = os.path.join(conf.test_dir, 'cats')
  28. os.mkdir(test_cats_dir)
  29. # Directory with our validation dog pictures
  30. test_dogs_dir = os.path.join(conf.test_dir, 'dogs')
  31. os.mkdir(test_dogs_dir)
  32. # Copy first 1000 cat images to train_cats_dir
  33. fnames = ['cat.{}.jpg'.format(i) for i in range(1000)]
  34. for fname in fnames:
  35. src = os.path.join(original_dataset_dir, fname)
  36. dst = os.path.join(train_cats_dir, fname)
  37. shutil.copyfile(src, dst)
  38. # Copy next 500 cat images to validation_cats_dir
  39. fnames = ['cat.{}.jpg'.format(i) for i in range(1000, 1500)]
  40. for fname in fnames:
  41. src = os.path.join(original_dataset_dir, fname)
  42. dst = os.path.join(validation_cats_dir, fname)
  43. shutil.copyfile(src, dst)
  44. # Copy next 500 cat images to test_cats_dir
  45. fnames = ['cat.{}.jpg'.format(i) for i in range(1500, 2000)]
  46. for fname in fnames:
  47. src = os.path.join(original_dataset_dir, fname)
  48. dst = os.path.join(test_cats_dir, fname)
  49. shutil.copyfile(src, dst)
  50. # Copy first 1000 dog images to train_dogs_dir
  51. fnames = ['dog.{}.jpg'.format(i) for i in range(1000)]
  52. for fname in fnames:
  53. src = os.path.join(original_dataset_dir, fname)
  54. dst = os.path.join(train_dogs_dir, fname)
  55. shutil.copyfile(src, dst)
  56. # Copy next 500 dog images to validation_dogs_dir
  57. fnames = ['dog.{}.jpg'.format(i) for i in range(1000, 1500)]
  58. for fname in fnames:
  59. src = os.path.join(original_dataset_dir, fname)
  60. dst = os.path.join(validation_dogs_dir, fname)
  61. shutil.copyfile(src, dst)
  62. # Copy next 500 dog images to test_dogs_dir
  63. fnames = ['dog.{}.jpg'.format(i) for i in range(1500, 2000)]
  64. for fname in fnames:
  65. src = os.path.join(original_dataset_dir, fname)
  66. dst = os.path.join(test_dogs_dir, fname)
  67. shutil.copyfile(src, dst)
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...