-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsamples.py
81 lines (75 loc) · 1.31 KB
/
samples.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
# Identifiers of the dog samples, kept as a plain list of strings in a
# fixed order.
DOG_SAMPLES = [
    'SAMN06172495',
    'SAMN06172481',
    'SAMN06172523',
    'SAMN06172473',
    'SAMN06172512',
    'SAMN06172522',
    'SAMN06172491',
    'SAMN06172421',
    'SAMN06172511',
    'SAMN06172505',
    'SAMN06172453',
    'SAMN06172443',
    'SAMN06172444',
    'SAMN06172445',
    'SAMN06172446',
    'SAMN06172447',
    'SAMN06172448',
    'SAMN06172449',
    'SAMN06172450',
    'SAMN06172451',
]
# Study label that accompanies DOG_SAMPLES.
DOG_STUDY = 'Coelho_dogs_2018'
# Each identifier listed below ends up in ZELLER_SAMPLES with a 'PAIRED/'
# prefix (presumably marking paired-end data -- confirm with the consumer).
ZELLER_SAMPLES = ['PAIRED/' + sample_id for sample_id in (
    'SAMEA4817960',
    'SAMEA4817939',
    'SAMEA4817907',
    'SAMEA4817900',
    'SAMEA4817972',
    'SAMEA4817969',
    'SAMEA4817928',
    'SAMEA4817943',
    'SAMEA4817947',
    'SAMEA4817948',
    'SAMEA4817949',
    'SAMEA4817950',
    'SAMEA4817951',
    'SAMEA4817952',
    'SAMEA4817953',
    'SAMEA4817954',
    'SAMEA4817955',
    'SAMEA4817956',
    'SAMEA4817957',
    'SAMEA4817958',
)]
# Study label that accompanies ZELLER_SAMPLES.
ZELLER_STUDY = 'Zeller_CRC_2014'
# Each identifier listed below ends up in TARA_SAMPLES with a 'PAIRED/'
# prefix (presumably marking paired-end data -- confirm with the consumer).
TARA_SAMPLES = ['PAIRED/' + sample_id for sample_id in (
    'SAMEA2591057',
    'SAMEA2591074',
    'SAMEA2591084',
    'SAMEA2591098',
    'SAMEA2591107',
    'SAMEA2591108',
    'SAMEA2591122',
    'SAMEA2591132',
    'SAMEA2619376',
    'SAMEA2619399',
    'SAMEA2619531',
    'SAMEA2619548',
    'SAMEA2619625',
    'SAMEA2619667',
    'SAMEA2619677',
    'SAMEA2619678',
    'SAMEA2619686',
    'SAMEA2619747',
    'SAMEA2619766',
    'SAMEA2619779',
)]
# Study label that accompanies TARA_SAMPLES.
TARA_STUDY = 'TaraOceans'
# Import-time sanity check: no sample list may contain the same entry twice
# (a list and the set built from it must have the same size).
assert all(
    len(set(samples)) == len(samples)
    for samples in (DOG_SAMPLES, ZELLER_SAMPLES, TARA_SAMPLES)
)