forked from OpenGVLab/VideoMAEv2
-
Notifications
You must be signed in to change notification settings - Fork 0
/
lrw_data_prepare.py
88 lines (84 loc) · 9.63 KB
/
lrw_data_prepare.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
import os
# Lookup table from an upper-case word to its integer class index (0 through 499).
# The script below takes the name of the directory two levels above each .mp4
# file, looks it up here, and writes the resulting index as that clip's label.
# NOTE(review): presumably this is the LRW word vocabulary (the dataset root is
# named "LRW") — confirm that the index order matches what the training code expects.
CATEGORY = {'UNION': 0, 'BECOME': 1, 'COMPANIES': 2, 'NUMBERS': 3, 'CHILDREN': 4, 'TEMPERATURES': 5, 'BUILD': 6, 'ANOTHER': 7,
'ECONOMY': 8, 'PARTIES': 9, 'FUTURE': 10, 'SERIOUS': 11, 'SIMPLY': 12, 'FOREIGN': 13, 'SINGLE': 14, 'SEEMS': 15,
'INCREASE': 16, 'VICTIMS': 17, 'NEVER': 18, 'RIGHTS': 19, 'AUTHORITIES': 20, 'MONTH': 21, 'EMERGENCY': 22, 'CLOUD': 23,
'SOUTH': 24, 'MILLION': 25, 'SHORT': 26, 'FRANCE': 27, 'JUSTICE': 28, 'SERVICE': 29, 'AGREE': 30, 'INVOLVED': 31,
'COUNCIL': 32, 'RATHER': 33, 'RATES': 34, 'HAPPENING': 35, 'GUILTY': 36, 'ELECTION': 37, 'LEVEL': 38, 'REFERENDUM': 39,
'AFRICA': 40, 'ENOUGH': 41, 'LATER': 42, 'MEETING': 43, 'WATER': 44, 'RUSSIAN': 45, 'MARKET': 46, 'LEADER': 47, 'WANTS': 48,
'MIDDLE': 49, 'OFFICE': 50, 'GOING': 51, 'SCOTLAND': 52, 'MINISTER': 53, 'WARNING': 54, 'WALES': 55, 'STREET': 56,
'SOMETHING': 57, 'GETTING': 58, 'CHANCE': 59, 'STAND': 60, 'FOOTBALL': 61, 'SITUATION': 62, 'CANCER': 63, 'CHINA': 64,
'PRICES': 65, 'PUBLIC': 66, 'QUESTIONS': 67, 'SENSE': 68, 'PARENTS': 69, 'TALKING': 70, 'MEDICAL': 71, 'CRIME': 72,
'RETURN': 73, 'BECAUSE': 74, 'INDUSTRY': 75, 'PRIME': 76, 'PAYING': 77, 'OPERATION': 78, 'ABSOLUTELY': 79, 'FRENCH': 80,
'PROCESS': 81, 'TOWARDS': 82, 'ISLAMIC': 83, 'OTHERS': 84, 'LARGE': 85, 'HEAVY': 86, 'ANYTHING': 87, 'OTHER': 88,
'TERMS': 89, 'REMEMBER': 90, 'WEEKEND': 91, 'SCHOOLS': 92, 'DESCRIBED': 93, 'TRYING': 94, 'SYRIA': 95, 'AMERICAN': 96,
'GREAT': 97, 'HOSPITAL': 98, 'PERSONAL': 99, 'RECENT': 100, 'AGAINST': 101, 'AMERICA': 102, 'ORDER': 103, 'WOULD': 104,
'CERTAINLY': 105, 'WEEKS': 106, 'NOTHING': 107, 'CAPITAL': 108, 'LATEST': 109, 'FORCE': 110, 'LEVELS': 111, 'GROUND': 112,
'MEASURES': 113, 'CANNOT': 114, 'ASKING': 115, 'MANCHESTER': 116, 'LIVES': 117, 'FORWARD': 118, 'TAKING': 119, 'AGAIN': 120,
'EVENING': 121, 'EXAMPLE': 122, 'NIGHT': 123, 'SYRIAN': 124, 'WELCOME': 125, 'FRONT': 126, 'PATIENTS': 127, 'WATCHING': 128,
'BRITAIN': 129, 'CUSTOMERS': 130, 'CHANGE': 131, 'WORKING': 132, 'WHILE': 133, 'AHEAD': 134, 'NATIONAL': 135,
'CONFERENCE': 136, 'MAKES': 137, 'PLANS': 138, 'FACING': 139, 'CHARGE': 140, 'HOURS': 141, 'WHICH': 142, 'COUNTRY': 143,
'RESPONSE': 144, 'WEAPONS': 145, 'STARTED': 146, 'EVIDENCE': 147, 'DOING': 148, 'MEDIA': 149, 'TAKEN': 150, 'STORY': 151,
'EXACTLY': 152, 'AMOUNT': 153, 'BIGGEST': 154, 'CAMERON': 155, 'DETAILS': 156, 'HEALTH': 157, 'MASSIVE': 158,
'VIOLENCE': 159, 'EVERYONE': 160, 'MAKING': 161, 'LITTLE': 162, 'FAMILIES': 163, 'STILL': 164, 'MINUTES': 165, 'HEART': 166,
'NORTH': 167, 'EXPECT': 168, 'POLITICS': 169, 'ISSUE': 170, 'DIFFERENT': 171, 'WAITING': 172, 'COMES': 173,
'POLITICIANS': 174, 'CHANGES': 175, 'UNDERSTAND': 176, 'WORLD': 177, 'SECRETARY': 178, 'ANNOUNCED': 179, 'FIGHT': 180,
'PRESS': 181, 'BENEFIT': 182, 'FIGURES': 183, 'SUNSHINE': 184, 'SPEND': 185, 'GENERAL': 186, 'MORNING': 187, 'WRONG': 188,
'LONGER': 189, 'CLOSE': 190, 'AFTERNOON': 191, 'STAFF': 192, 'AFFAIRS': 193, 'INQUIRY': 194, 'DAVID': 195, 'POINT': 196,
'INSIDE': 197, 'SECTOR': 198, 'THIRD': 199, 'NORTHERN': 200, 'MEANS': 201, 'BUSINESSES': 202, 'CONFLICT': 203,
'DIFFICULT': 204, 'SCOTTISH': 205, 'THINK': 206, 'TOMORROW': 207, 'EVENTS': 208, 'MINISTERS': 209, 'COURSE': 210,
'BETWEEN': 211, 'ASKED': 212, 'EVERYTHING': 213, 'ARRESTED': 214, 'BUDGET': 215, 'OPPOSITION': 216, 'WEATHER': 217,
'PLACE': 218, 'POWER': 219, 'WORDS': 220, 'SMALL': 221, 'COULD': 222, 'DESPITE': 223, 'LABOUR': 224, 'RUNNING': 225,
'CONTROL': 226, 'POTENTIAL': 227, 'IRELAND': 228, 'HOUSE': 229, 'FINANCIAL': 230, 'MATTER': 231, 'THOSE': 232,
'COMPANY': 233, 'RUSSIA': 234, 'ENERGY': 235, 'GEORGE': 236, 'WITHOUT': 237, 'STATES': 238, 'LEAST': 239, 'SUPPORT': 240,
'EVERYBODY': 241, 'UNDER': 242, 'CURRENT': 243, 'PRISON': 244, 'HAVING': 245, 'DECIDED': 246, 'DEBATE': 247, 'HOMES': 248,
'EXPECTED': 249, 'PROBLEM': 250, 'STATEMENT': 251, 'FIRST': 252, 'BETTER': 253, 'POLICE': 254, 'FOUND': 255, 'SYSTEM': 256,
'AFTER': 257, 'MURDER': 258, 'BUILDING': 259, 'JUDGE': 260, 'PERHAPS': 261, 'REASON': 262, 'PROTECT': 263, 'EUROPE': 264,
'ACTION': 265, 'TRUST': 266, 'MOVING': 267, 'QUITE': 268, 'SAYING': 269, 'PRICE': 270, 'FORMER': 271, 'THREE': 272,
'BEFORE': 273, 'THEIR': 274, 'GROUP': 275, 'LEADERS': 276, 'EDUCATION': 277, 'BELIEVE': 278, 'HEARD': 279,
'IMMIGRATION': 280, 'CAMPAIGN': 281, 'LIKELY': 282, 'THESE': 283, 'CONSERVATIVE': 284, 'CHIEF': 285, 'SPEECH': 286,
'PEOPLE': 287, 'PARTS': 288, 'LONDON': 289, 'THERE': 290, 'HUNDREDS': 291, 'OFTEN': 292, 'COUPLE': 293, 'GAMES': 294,
'PROBABLY': 295, 'WHOLE': 296, 'GIVING': 297, 'CASES': 298, 'FAMILY': 299, 'MONEY': 300, 'BEING': 301, 'BANKS': 302,
'FOCUS': 303, 'TOGETHER': 304, 'GERMANY': 305, 'ACTUALLY': 306, 'CONCERNS': 307, 'VOTERS': 308, 'WOMEN': 309, 'STATE': 310,
'PROBLEMS': 311, 'TODAY': 312, 'SECOND': 313, 'INFLATION': 314, 'HAPPENED': 315, 'TRIAL': 316, 'SCHOOL': 317, 'DEATH': 318,
'TONIGHT': 319, 'MEMBER': 320, 'FINAL': 321, 'ATTACK': 322, 'OUTSIDE': 323, 'THOUSANDS': 324, 'EVERY': 325, 'COMING': 326,
'BRING': 327, 'GROWING': 328, 'ACCUSED': 329, 'ISSUES': 330, 'POLITICAL': 331, 'OFFICERS': 332, 'JAMES': 333, 'YEARS': 334,
'PARLIAMENT': 335, 'WESTMINSTER': 336, 'EASTERN': 337, 'MAYBE': 338, 'HOUSING': 339, 'MEMBERS': 340, 'HIGHER': 341,
'MESSAGE': 342, 'OBAMA': 343, 'STAGE': 344, 'CENTRAL': 345, 'EXTRA': 346, 'PARTY': 347, 'THING': 348, 'ABUSE': 349,
'POSSIBLE': 350, 'LEGAL': 351, 'INVESTMENT': 352, 'ECONOMIC': 353, 'POWERS': 354, 'WHERE': 355, 'DECISION': 356,
'SOUTHERN': 357, 'GIVEN': 358, 'REPORT': 359, 'FURTHER': 360, 'MAJORITY': 361, 'WITHIN': 362, 'COURT': 363, 'SECURITY': 364,
'CLAIMS': 365, 'WELFARE': 366, 'EARLY': 367, 'MILITARY': 368, 'INTEREST': 369, 'MIGHT': 370, 'CALLED': 371, 'PHONE': 372,
'WESTERN': 373, 'INDEPENDENT': 374, 'LIVING': 375, 'RIGHT': 376, 'SPENDING': 377, 'PRETTY': 378, 'BEHIND': 379,
'ALREADY': 380, 'ATTACKS': 381, 'MISSING': 382, 'BRITISH': 383, 'SIDES': 384, 'POLICY': 385, 'YOUNG': 386, 'BENEFITS': 387,
'START': 388, 'PRESIDENT': 389, 'SINCE': 390, 'CHARGES': 391, 'SENIOR': 392, 'SOCIAL': 393, 'GREECE': 394, 'LOCAL': 395,
'YESTERDAY': 396, 'AMONG': 397, 'CHILD': 398, 'TALKS': 399, 'MAJOR': 400, 'WHETHER': 401, 'FIGHTING': 402, 'GROWTH': 403,
'PROVIDE': 404, 'SEVEN': 405, 'ANSWER': 406, 'UNTIL': 407, 'ACROSS': 408, 'MIGRANTS': 409, 'REPORTS': 410, 'FOLLOWING': 411,
'PERIOD': 412, 'SUNDAY': 413, 'BILLION': 414, 'WINDS': 415, 'COUNTRIES': 416, 'SHOULD': 417, 'SPEAKING': 418, 'REALLY': 419,
'WANTED': 420, 'SPECIAL': 421, 'IMPORTANT': 422, 'ITSELF': 423, 'USING': 424, 'WORKERS': 425, 'ACCORDING': 426,
'ENGLAND': 427, 'HISTORY': 428, 'BORDER': 429, 'CHALLENGE': 430, 'BROUGHT': 431, 'SIGNIFICANT': 432, 'ALLEGATIONS': 433,
'NEEDS': 434, 'RESULT': 435, 'ALLOW': 436, 'MOMENT': 437, 'PRESSURE': 438, 'GLOBAL': 439, 'THOUGHT': 440, 'SEVERAL': 441,
'QUESTION': 442, 'CLEAR': 443, 'HAPPEN': 444, 'PERSON': 445, 'PRIVATE': 446, 'POSITION': 447, 'ALLOWED': 448, 'RULES': 449,
'SOMEONE': 450, 'SERIES': 451, 'THEMSELVES': 452, 'ALWAYS': 453, 'CONTINUE': 454, 'MONTHS': 455, 'INFORMATION': 456,
'THREAT': 457, 'SOCIETY': 458, 'STRONG': 459, 'OFFICIALS': 460, 'EUROPEAN': 461, 'FRIDAY': 462, 'CRISIS': 463,
'GOVERNMENT': 464, 'COMMUNITY': 465, 'AFFECTED': 466, 'MILLIONS': 467, 'ABOUT': 468, 'DEFICIT': 469, 'IMPACT': 470,
'ACCESS': 471, 'BUSINESS': 472, 'THROUGH': 473, 'DURING': 474, 'EDITOR': 475, 'FORCES': 476, 'RECORD': 477, 'LEAVE': 478,
'BLACK': 479, 'LEADERSHIP': 480, 'TIMES': 481, 'UNITED': 482, 'WORST': 483, 'LOOKING': 484, 'THINGS': 485, 'ALMOST': 486,
'SPENT': 487, 'HUMAN': 488, 'SERVICES': 489, 'KILLED': 490, 'DIFFERENCE': 491, 'DEGREES': 492, 'AGREEMENT': 493,
'TRADE': 494, 'AROUND': 495, 'KNOWN': 496, 'NUMBER': 497, 'PLACES': 498, 'AREAS': 499}
# Root of the dataset tree; the three annotation CSVs are written directly into it.
datadir = "/home/yxwang/Dataset/LRW"

# Names of the per-word split sub-directories; each one gets its own output CSV.
SPLITS = ("train", "val", "test")


def collect_samples(data_root, categories, splits=SPLITS):
    """Walk *data_root* and group one annotation line per ``.mp4`` clip by split.

    The expected layout is ``<data_root>/<WORD>/<split>/<clip>.mp4``: the
    directory holding a clip names its split and that directory's parent
    names the word.

    Args:
        data_root: Directory to scan recursively.
        categories: Mapping from word directory name to integer class index.
        splits: Split directory names to collect; any other directory is
            ignored because its clips belong to no output file.

    Returns:
        A dict mapping each split name to a list of ``"<path> <index>\\n"``
        lines, in sorted traversal order.

    Raises:
        KeyError: If a split directory containing clips sits under a word
            directory that is missing from *categories*.
    """
    samples = {name: [] for name in splits}
    for root, dirs, files in os.walk(data_root):
        # os.walk order is filesystem-dependent; sorting in place makes the
        # traversal (and therefore the generated CSVs) reproducible.
        dirs.sort()
        word_dir, split = os.path.split(root)
        if split not in samples:
            continue
        # Match on the real extension so names such as "clip.mp4.part" are
        # not picked up the way a substring test would.
        clips = sorted(name for name in files if name.endswith(".mp4"))
        if not clips:
            continue
        word = os.path.basename(word_dir)
        if word not in categories:
            raise KeyError(
                f"no class index for word directory {word!r} (from {root})"
            )
        label = categories[word]
        samples[split].extend(f"{root}/{name} {label}\n" for name in clips)
    return samples


def write_split_files(data_root, samples):
    """Write each split's lines to ``<data_root>/videoMAE_<split>.csv``.

    Args:
        data_root: Directory that receives the CSV files.
        samples: Mapping of split name to annotation lines, as returned by
            ``collect_samples``.
    """
    for split, lines in samples.items():
        out_path = os.path.join(data_root, f"videoMAE_{split}.csv")
        with open(out_path, "w", encoding="utf-8") as handle:
            handle.writelines(lines)


def main():
    """Build the train/val/test annotation CSVs for the tree at ``datadir``."""
    write_split_files(datadir, collect_samples(datadir, CATEGORY))


if __name__ == "__main__":
    main()