File size: 1,619 Bytes
73ed896
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
# VGGSound: raw-video dataset entry whose subset list is sets/vgg3-train.tsv.
# NOTE(review): all paths here are relative; what they are resolved against
# (launch directory vs. `root`) is not visible in this file — confirm with the
# loader.
VGGSound:
  # Base directory for the video files (presumably; verify against the loader).
  root: ../data/video
  # Subset list file; the "train" suffix suggests the training split.
  subset_name: sets/vgg3-train.tsv
  # Frame sampling settings. Units are assumed from the key names (frames per
  # second, pixels, seconds) — TODO confirm how the loader applies them.
  fps: 8
  height: 384
  width: 384
  sample_duration_sec: 8.0

# VGGSound_test: same root and frame settings as the VGGSound entry, but the
# subset list is sets/vgg3-test.tsv.
# NOTE(review): presumably the held-out test split — confirm with the loader.
VGGSound_test:
  root: ../data/video
  subset_name: sets/vgg3-test.tsv
  # Frame settings are identical to the VGGSound and VGGSound_val entries;
  # keep all three in sync when changing any of them.
  fps: 8
  height: 384
  width: 384
  sample_duration_sec: 8.0

# VGGSound_val: same root and frame settings as the VGGSound entry, but the
# subset list is sets/vgg3-val.tsv.
# NOTE(review): presumably the validation split — confirm with the loader.
VGGSound_val:
  root: ../data/video
  subset_name: sets/vgg3-val.tsv
  # Frame settings are identical to the VGGSound and VGGSound_test entries;
  # keep all three in sync when changing any of them.
  fps: 8
  height: 384
  width: 384
  sample_duration_sec: 8.0

# ExtractedVGG: a TSV index plus a memmap directory, both under
# ../data/v1-16-memmap and both named vgg-train.
# NOTE(review): presumably pre-extracted VGGSound training features stored as
# memory-mapped arrays — the on-disk format is not shown here; verify.
ExtractedVGG:
  tsv: ../data/v1-16-memmap/vgg-train.tsv
  memmap_dir: ../data/v1-16-memmap/vgg-train

# ExtractedVGG_test: TSV index and memmap directory for vgg-test, plus
# evaluation-related settings (tag, gt_cache, output_subdir).
ExtractedVGG_test:
  tag: test
  # NOTE(review): looks like a cache location for ground-truth data used in
  # evaluation — confirm what the consumer stores here.
  gt_cache: ../data/eval-cache/vggsound-test
  # Explicitly null for this entry, whereas ExtractedVGG_val sets it to `val`.
  # How the consumer treats null is not visible here — TODO confirm.
  output_subdir: null
  tsv: ../data/v1-16-memmap/vgg-test.tsv
  memmap_dir: ../data/v1-16-memmap/vgg-test

# ExtractedVGG_val: TSV index and memmap directory for vgg-val, plus
# evaluation-related settings (tag, gt_cache, output_subdir).
ExtractedVGG_val:
  tag: val
  # NOTE(review): looks like a cache location for ground-truth data used in
  # evaluation — confirm what the consumer stores here.
  gt_cache: ../data/eval-cache/vggsound-val
  # Set to `val` for this entry, whereas ExtractedVGG_test leaves it null.
  output_subdir: val
  tsv: ../data/v1-16-memmap/vgg-val.tsv
  memmap_dir: ../data/v1-16-memmap/vgg-val

# AudioCaps: TSV index and memmap directory under ../data/v1-16-memmap,
# both named audiocaps.
# NOTE(review): the contents of the TSV and memmap files are not described in
# this file — see the consuming dataset code.
AudioCaps:
  tsv: ../data/v1-16-memmap/audiocaps.tsv
  memmap_dir: ../data/v1-16-memmap/audiocaps

# AudioSetSL: TSV index and memmap directory under ../data/v1-16-memmap,
# both named audioset_sl.
# NOTE(review): the contents of the TSV and memmap files are not described in
# this file — see the consuming dataset code.
AudioSetSL:
  tsv: ../data/v1-16-memmap/audioset_sl.tsv
  memmap_dir: ../data/v1-16-memmap/audioset_sl

# BBCSound: TSV index and memmap directory under ../data/v1-16-memmap,
# both named bbcsound.
# NOTE(review): the contents of the TSV and memmap files are not described in
# this file — see the consuming dataset code.
BBCSound:
  tsv: ../data/v1-16-memmap/bbcsound.tsv
  memmap_dir: ../data/v1-16-memmap/bbcsound

# FreeSound: TSV index and memmap directory under ../data/v1-16-memmap,
# both named freesound.
# NOTE(review): the contents of the TSV and memmap files are not described in
# this file — see the consuming dataset code.
FreeSound:
  tsv: ../data/v1-16-memmap/freesound.tsv
  memmap_dir: ../data/v1-16-memmap/freesound

# Clotho: TSV index and memmap directory under ../data/v1-16-memmap,
# both named clotho.
# NOTE(review): the contents of the TSV and memmap files are not described in
# this file — see the consuming dataset code.
Clotho:
  tsv: ../data/v1-16-memmap/clotho.tsv
  memmap_dir: ../data/v1-16-memmap/clotho

# Example_video: TSV index and memmap directory named vgg-example.
# Unlike the ../data/v1-16-memmap entries, these paths start with
# ./training/example_output/memmap.
# NOTE(review): presumably produced by an example extraction run and meant to
# be used from the repository root — confirm.
Example_video:
  tsv: ./training/example_output/memmap/vgg-example.tsv
  memmap_dir: ./training/example_output/memmap/vgg-example

# Example_audio: TSV index and memmap directory named audio-example.
# Unlike the ../data/v1-16-memmap entries, these paths start with
# ./training/example_output/memmap.
# NOTE(review): presumably produced by an example extraction run and meant to
# be used from the repository root — confirm.
Example_audio:
  tsv: ./training/example_output/memmap/audio-example.tsv
  memmap_dir: ./training/example_output/memmap/audio-example