#!/bin/bash
#
# Record the line counts of the credit-card datasets.
#
# Inputs (relative to the current working directory):
#   data/creditcard_shuf.csv    original dataset
#   data/creditcard_train.csv   training dataset
#   data/creditcard_test.csv    testing dataset
#
# Outputs (the directory is created if needed):
#   stats_data/stats.txt        line count of the original dataset
#   stats_data/stats_train.txt  line count of the training dataset
#   stats_data/stats_test.txt   line count of the testing dataset
#
# Each output file holds exactly what `wc -l < FILE` prints for its input.
# The script exits non-zero, before writing anything, if an input is missing.

set -euo pipefail

readonly DATA_DIR="data"
readonly STATS_DIR="stats_data"

# Print an error message to stderr and abort the script.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

#######################################
# Write the line count of one file to another file.
# Arguments: $1 - file whose lines are counted
#            $2 - file that receives the count
# Returns:   status of the wc/redirection
#######################################
write_line_count() {
  local src=$1
  local dst=$2
  # Feeding the file on stdin keeps the file name out of wc's output.
  wc -l < "$src" > "$dst"
}

main() {
  # Input/output pairs, kept in matching order.
  local -a inputs=(
    "${DATA_DIR}/creditcard_shuf.csv"
    "${DATA_DIR}/creditcard_train.csv"
    "${DATA_DIR}/creditcard_test.csv"
  )
  local -a outputs=(
    "${STATS_DIR}/stats.txt"
    "${STATS_DIR}/stats_train.txt"
    "${STATS_DIR}/stats_test.txt"
  )
  local i

  # Validate every input up front so a missing file cannot leave a
  # partially populated statistics directory behind.
  for i in "${!inputs[@]}"; do
    [[ -r "${inputs[i]}" ]] || die "cannot read ${inputs[i]}"
  done

  # Create the directory for the statistics.
  mkdir -p -- "$STATS_DIR"

  # Write each count straight into the statistics directory instead of
  # staging it in the working directory and moving it afterwards.
  for i in "${!inputs[@]}"; do
    write_line_count "${inputs[i]}" "${outputs[i]}"
  done
}

main "$@"