forked from CMSROMA/Utilities
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathremove_dup.awk
58 lines (52 loc) · 1.45 KB
/
remove_dup.awk
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
BEGIN{
old=0;
new =0;
line="";
dup="";
fsize_new=-1;
}
(NR!=0){
if(match($0,"[0-9]*_[0-9]*_[0-9a-zA-Z][0-9a-zA-Z][0-9a-zA-Z]\.root")){ # if the file is a typical castor output
end=substr($1,RSTART);
start=substr($1,0,RSTART);
n = split(end, end_, "_");
# print n, $0 >> "/dev/stderr"
# print end_[1], end_[2], end_[3], " -- ", $2 >> "/dev/stderr"
if(match(end_[3],"[a-zA-Z]+.*\.root")){ # se soddisfa anche a questa,
# allora e' prodotto da crab server
if(end_[1]!=old || start!=old_start){
# print the old line
print line
old=end_[1];
new =end_[2];
old_start=start;
line = $0;
fsize_old=$2
} else {
#print end_[1], end_[2], end_[3];
if(end_[2]>new || $2>fsize_old){
string1="basename "line
string2="basename "$0
string2 | getline filename_new
string1 | getline filename_old
print "[STATUS] "string1, string2 >> "/dev/stderr"
print "[STATUS] removing "filename_old" as duplicate of "filename_new"" >> "/dev/stderr"
new = end_[2];
line = $0;
fsize_old=fsize_new;
fsize_new=$2;
} else{
string1="basename "line
string2="basename "$0
string2 | getline filename_new
string1 | getline filename_old
print "[STATUS] "string1, string2 >> "/dev/stderr"
print "[STATUS] removing "filename_new" as duplicate of "filename_old"" >> "/dev/stderr"
}
}
} else print $0
} else print $0
}
END{
if(line!="") print line
}