Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
DataScienceUWL
GitHub Repository: DataScienceUWL/DS775
Path: blob/main/Lessons/Lesson 14 - RecSys 2/resources/data/movielens/mku.sh
871 views
1
#!/bin/sh
#
# mku.sh -- rebuild the train/test split files from u.data.
#
# Reads u.data from the current directory and writes, also in the current
# directory:
#   u1.test .. u5.test   test set i is the i-th consecutive block of 20000
#                        lines of u.data
#   u1.base .. u5.base   base set i is the first 20000*(i-1) lines of u.data
#                        followed by its last 20000*(5-i) lines (i.e. the
#                        complement of test set i when u.data has exactly
#                        100000 lines)
#   ua.base/ua.test and ub.base/ub.test
#                        created by allbut.pl (looked up on PATH), then
#                        sorted in place
# Every output file is sorted numerically on field 1, then on field 2.

# Scratch file; the PID suffix keeps concurrent runs from colliding.
tmp=tmp.$$

# Number of lines in each of the five test blocks.
block=20000

# Field separator handed to sort(1), built with printf so the tab stays
# visible and survives copy/paste.
# NOTE(review): the MovieLens 100K README documents u.data as tab-separated.
# The reviewed copy of this script showed a blank between the quotes of
# -t"...", which would make sort treat each whole line as field 1 and ignore
# the second key. Confirm against your copy of u.data.
tab=$(printf '\t')

# Remove the scratch file and abort on HUP (1), INT (2) or TERM (15).
# The action must be single-quoted: written in backticks it is executed once,
# immediately, as a command substitution, and no handler is installed.
trap 'rm -f "$tmp"; exit 1' 1 2 15

# sort_records FILE...
# Write the given files to stdout, ordered numerically by field 1 and then
# by field 2.
sort_records() {
  sort -t "$tab" -k 1,1n -k 2,2n "$@"
}

# sort_in_place FILE
# Replace FILE with its sorted contents. FILE is only overwritten when the
# sort succeeded; on failure the scratch file is removed, FILE is left
# untouched and a non-zero status is returned.
sort_in_place() {
  if sort_records "$1" > "$tmp"; then
    mv "$tmp" "$1"
  else
    rm -f "$tmp"
    return 1
  fi
}

for i in 1 2 3 4 5; do
  # Test set: lines (i-1)*block+1 .. i*block of u.data.
  head -n "$(( i * block ))" u.data | tail -n "$block" > "$tmp"
  sort_records "$tmp" > "u$i.test"

  # Base set: everything before the test block plus the trailing lines.
  head -n "$(( (i - 1) * block ))" u.data > "$tmp"
  tail -n "$(( (5 - i) * block ))" u.data >> "$tmp"
  sort_records "$tmp" > "u$i.base"
done

# allbut.pl writes <prefix>.base and <prefix>.test.
# NOTE(review): the meaning of the numeric arguments is defined by allbut.pl,
# which is not visible here; presumably "1 10" / "11 20" select which ratings
# per user are held out and 100000 is the number of input lines -- confirm.
allbut.pl ua 1 10 100000 u.data
sort_in_place ua.base
sort_in_place ua.test

allbut.pl ub 11 20 100000 u.data
sort_in_place ub.base
sort_in_place ub.test