-
Notifications
You must be signed in to change notification settings - Fork 15
/
cleaner.go
138 lines (123 loc) · 4.51 KB
/
cleaner.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
package subtitles
import (
"fmt"
"strings"
"time"
"github.com/fatih/color"
)
// ResyncSubs adjust text timing by `sync` milliseconds
func (subtitle *Subtitle) ResyncSubs(sync int) {
// log.Printf("resyncing with %d\n", sync)
for i := range subtitle.Captions {
subtitle.Captions[i].Start = subtitle.Captions[i].Start.
Add(time.Duration(sync) * time.Millisecond)
subtitle.Captions[i].End = subtitle.Captions[i].End.
Add(time.Duration(sync) * time.Millisecond)
}
}
var (
advertisements = []string{
// english:
"captions paid for by",
"english subtitles",
"subtitles -", "subtitles:", "subtitles by",
"subtitles downloaded",
"captioning by", "captions by", "captioning made possible by",
"mtv network", "turner entertainment group", "fox broadcasting",
"carsey-werner", "red bee media",
"transcript :", "transcript:", "transcript by",
"sync, corrected", "synced and corrected",
"sync and corrected", "sync & correction",
"sync and corrections",
"traduction:", "transcript par",
"corrections by", "corrected by",
"n17t01", "vnaru", "honeybunny", "sp8ky", "susanalc", "f1nc0", "euroeuro",
"skmatt",
"synchro :", "synchro:", "synced by", "synchronized by",
"synchronization by", "synchronisation:",
"resynchronization:",
"resync:", "resynchro", "resync by",
"translation by",
"encoded by",
"downloaded from",
"web-dl", "xvid",
"subscene", "podnapisi", "bokutox", "team nanban",
"fury_don@hotmail.com",
"broadcasttext",
"seriessub", "subtitlesource",
"addic7ed", "addicted.com", "vaioholics",
"sdimedia", "sdi media",
"allsubs.org", "hdbits.org", "bierdopje.com", "subcentral", "mkvcage",
"cssubs", "tvsub", "uksubtitles",
"ragbear.com", "ydy.com", "yyets.net", "indivx.net", "sub-way.fr",
"forom.com", "forom. com", "facebook.com", "hdvietnam.com", "sapo.pt", "softhome.net",
"americascardroom.com", "subti.com", "tugazx", "pirata-tuga",
"napisy.org", "1000fr.com", "yts.mx", "yts.am", "yts.ag", "yts.lt",
"opensubtitles", "open subtitles", "s u b t i t l e",
"sous-titres.eu", "300mbfilms.com", "put.io", "subtitulos.es", "osdb.link", "300mbunited",
"simail.si", "sf-film.dk", "sf.net", "vitac.com", "rapidpremium", "psarips",
"yify-torrents", "yify torrents", "yify movies",
"thepiratebay", "anoxmous", "verdikt", "la fisher team", "red bee media",
"mkv player", "mkv-potplayer-vlc", "best watched using", "best play with",
"advertise your product", "remove all ads",
"memoryonsmells", "1st-booking",
":[gwc]:", "ripped with subrip", "titra film",
"hiqve", "kentir.bb", "w-bb.org", "sub download",
"trimark home video",
"captionmax", "southparknews",
"national captioning institute",
// swedish:
"swedish subtitles", "svenska undertexter", "internationella undertexter",
"svensktextning", "(c) sveriges televisionit", "sveriges television ab",
"undertexter.se", "undertexter. se", "swesub.nu", "divxsweden", "undertext.com", "undertext.se",
"undertext av", "översatt av", "översättning:", "översättning av", "rättad av",
"synkad av", "synkat av", "synk:", "synkning:", "redigerad av", "textning:",
"svensk text", "text:", "omsynk:", "omsynkad",
"transkribering:", "piratpartiet.se",
"korrektur:", "korrekturläst", "texter på nätet", "text hämtad från",
"din filmsajt på nätet", "din största filmsajt på nätet",
"alltid nya texter",
"senaste undertexter på",
"programtextning", "översättargrupp",
"mediatextgruppen", "visiontext", "scandinavian text service",
"jhs International", "svensk medietext",
// norweigan:
"norsk tekst:", "norske tekster:",
// danish:
"oversættelse:", "tekster:",
// finnish:
"suomennos:",
// french:
"relecture et corrections finales:", "sous-titres par", "el uploador",
}
)
// RemoveAds removes advertisement from the subtitles
func (subtitle *Subtitle) RemoveAds(outputPrefix string, verbose bool) *Subtitle {
info := color.New(color.FgGreen, color.BgBlack).SprintFunc()
orange := color.New(color.FgBlack, color.BgHiYellow).SprintFunc()
seq := 1
res := []Caption{}
for orgSeq, sub := range subtitle.Captions {
isAd := false
block := ""
for _, line := range sub.Text {
block += strings.ToLower(line) + " "
}
for _, adLine := range advertisements {
if !isAd && strings.Contains(block, adLine) {
isAd = true
if verbose {
fmt.Printf("%s [ads] %d %s matched (%s)\n", info(outputPrefix), (orgSeq + 1), orange(sub.Text), adLine)
}
break
}
}
if !isAd {
sub.Seq = seq
res = append(res, sub)
seq++
}
}
subtitle.Captions = res
return subtitle
}