-
Notifications
You must be signed in to change notification settings - Fork 8
/
rarbg.go
259 lines (233 loc) · 8.54 KB
/
rarbg.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
package imdb2torrent
import (
"context"
"fmt"
"io/ioutil"
"net/http"
"strconv"
"strings"
"sync"
"time"
"github.com/tidwall/gjson"
"go.uber.org/zap"
)
// RARBGclientOptions holds the settings from which a RARBG client is built.
type RARBGclientOptions struct {
// BaseURL is the prefix of all API request URLs.
// Typically "https://torrentapi.org"
BaseURL string
// Timeout is used as the timeout of the client's HTTP client.
Timeout time.Duration
// CacheAge is the age after which a cached torrent list is treated as expired.
CacheAge time.Duration
}
// NewRARBGclientOpts bundles the given base URL, HTTP timeout and cache age
// into a RARBGclientOptions value.
func NewRARBGclientOpts(baseURL string, timeout, cacheAge time.Duration) RARBGclientOptions {
	var opts RARBGclientOptions
	opts.BaseURL = baseURL
	opts.Timeout = timeout
	opts.CacheAge = cacheAge
	return opts
}
// DefaultRARBGclientOpts is a ready-made set of options: the torrentapi.org base URL,
// a 5 second HTTP timeout and a cache age of 24 hours.
var DefaultRARBGclientOpts = RARBGclientOptions{
BaseURL: "https://torrentapi.org",
Timeout: 5 * time.Second,
CacheAge: 24 * time.Hour,
}
// Compile-time check that *rarbgClient can be used as a MagnetSearcher.
var _ MagnetSearcher = (*rarbgClient)(nil)
// rarbgClient searches for torrents via RARBG's API (torrentapi).
// It caches results, manages the API token and spaces out its requests.
type rarbgClient struct {
// baseURL is the prefix of all API request URLs.
baseURL string
// httpClient sends all API requests.
httpClient *http.Client
// cache stores torrent lists per search ID.
cache Cache
// cacheAge is the age after which a cached torrent list is treated as expired.
cacheAge time.Duration
logger *zap.Logger
// logFoundTorrents enables a debug log entry for every torrent that is found.
logFoundTorrents bool
// token is the API token sent with search requests. It's set by RefreshToken.
token string
// tokenExpired reports whether the token must be refreshed before the next search.
// It's replaced by RefreshToken each time a new token is fetched.
tokenExpired func() bool
// lastRequest is the time the previous API request finished.
// It's used to keep 2 seconds between requests.
lastRequest time.Time
// lock serializes the API requests.
lock *sync.Mutex
}
// NewRARBGclient creates a RARBG client from the given options, cache and logger.
// If logFoundTorrents is true, every found torrent is written to the debug log.
// The client starts without a token, so the first search that misses the cache fetches one.
func NewRARBGclient(opts RARBGclientOptions, cache Cache, logger *zap.Logger, logFoundTorrents bool) *rarbgClient {
	client := new(rarbgClient)

	client.baseURL = opts.BaseURL
	client.httpClient = &http.Client{Timeout: opts.Timeout}

	client.cache = cache
	client.cacheAge = opts.CacheAge

	client.logger = logger
	client.logFoundTorrents = logFoundTorrents

	// No token has been fetched yet, so it's reported as expired until RefreshToken replaces this func.
	client.tokenExpired = func() bool { return true }
	client.lock = &sync.Mutex{}

	return client
}
// FindMovie searches RARBG's API for torrents of the movie with the given IMDb ID.
// If no error occurred, but there are just no torrents for the movie yet, an empty result and *no* error are returned.
func (c *rarbgClient) FindMovie(ctx context.Context, imdbID string) ([]Result, error) {
	// The IMDb ID is both the cache ID and, inserted as-is, the search parameter.
	return c.find(ctx, imdbID, "search_imdb="+imdbID)
}
// FindTVShow searches RARBG's API for torrents of a single TV show episode, identified by the show's IMDb ID plus season and episode number.
// If no error occurred, but there are just no torrents for the TV show yet, an empty result and *no* error are returned.
func (c *rarbgClient) FindTVShow(ctx context.Context, imdbID string, season, episode int) ([]Result, error) {
	// zeroPad renders n in decimal and puts a "0" in front when n is below 10.
	zeroPad := func(n int) string {
		digits := strconv.Itoa(n)
		if n < 10 {
			return "0" + digits
		}
		return digits
	}

	// The ID used for caching and logging carries the plain, unpadded numbers.
	episodeID := strings.Join([]string{imdbID, strconv.Itoa(season), strconv.Itoa(episode)}, ":")

	// RARBG / torrentapi supports TV show search via the show's IMDb ID (and only via the show's ID),
	// AND allows an additional filter by name, which is used here to narrow the results down
	// to the season + episode, e.g. "S01E05".
	query := "search_imdb=" + imdbID + "&search_string=S" + zeroPad(season) + "E" + zeroPad(episode)

	return c.find(ctx, episodeID, query)
}
// find looks up torrents for the given ID, first in the cache and then via RARBG's API.
//
// id is used for the cache key and for logging. escapedQuery is appended verbatim to the
// request URL, so it must be URL-escaped already. ctx is currently not used: neither the
// rate limit wait nor the HTTP request are bound to it.
//
// Return values:
//   - Cached, non-expired results are returned directly.
//   - If the token can't be refreshed, the error is logged and nil, nil is returned.
//   - If the request can't be created or sent, the response status isn't 200 or the body
//     can't be read, an error is returned.
//   - If the response contains no torrents, nil, nil is returned and nothing is cached.
//   - Otherwise the torrents with a recognized quality and a valid info hash are cached and returned.
func (c *rarbgClient) find(ctx context.Context, id, escapedQuery string) ([]Result, error) {
	zapFieldID := zap.String("id", id)
	zapFieldTorrentSite := zap.String("torrentSite", "RARBG")

	// Check cache first. Every case except a fresh hit falls through to the API request.
	cacheKey := id + "-RARBG"
	torrentList, created, found, err := c.cache.Get(cacheKey)
	switch {
	case err != nil:
		c.logger.Error("Couldn't get torrent results from cache", zap.Error(err), zapFieldID, zapFieldTorrentSite)
	case !found:
		c.logger.Debug("Torrent results not found in cache", zapFieldID, zapFieldTorrentSite)
	case time.Since(created) > c.cacheAge:
		expiredSince := time.Since(created.Add(c.cacheAge))
		c.logger.Debug("Hit cache for torrents, but item is expired", zap.Duration("expiredSince", expiredSince), zapFieldID, zapFieldTorrentSite)
	default:
		c.logger.Debug("Hit cache for torrents, returning results", zap.Int("torrentCount", len(torrentList)), zapFieldID, zapFieldTorrentSite)
		return torrentList, nil
	}

	// Check token expiration.
	// RefreshToken replaces c.tokenExpired while holding the lock, so it's read under the lock as well.
	// The lock must be released again before calling RefreshToken, which acquires it itself.
	c.lock.Lock()
	expired := c.tokenExpired()
	c.lock.Unlock()
	if expired {
		if err = c.RefreshToken(); err != nil {
			c.logger.Error("Couldn't refresh token", zap.Error(err), zapFieldID, zapFieldTorrentSite)
			return nil, nil
		}
	}

	// Prevent concurrent requests *and* wait for 2 seconds to pass if necessary, so we don't hit the rate limit
	c.lock.Lock()
	defer c.lock.Unlock()
	time.Sleep(2*time.Second - time.Since(c.lastRequest))
	// Deferred calls run in reverse order, so this runs *before* the unlock above.
	// The timestamp must be written while the lock is still held: otherwise the next goroutine
	// could read a stale lastRequest and send its request too early.
	defer func() {
		c.lastRequest = time.Now()
	}()

	// `format=json_extended` for size info
	url := c.baseURL + "/pubapi_v2.php?app_id=deflix&mode=search&sort=seeders&format=json_extended&ranked=0&token=" + c.token + "&" + escapedQuery
	req, err := http.NewRequest("GET", url, nil)
	if err != nil {
		return nil, fmt.Errorf("Couldn't create request: %v", err)
	}
	// For one and the same IMDb ID, RARBG sometimes returns results, sometimes a JSON saying that no result was found.
	// The rate of success is higher with cURL, and very low when doing `c.httpClient.Get(url)`, so we're trying to identify as cURL.
	req.Header.Set("User-Agent", "curl/7.47.0")
	req.Header.Set("Accept", "*/*")
	res, err := c.httpClient.Do(req)
	if err != nil {
		return nil, fmt.Errorf("Couldn't GET %v: %v", url, err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		return nil, fmt.Errorf("Bad GET response: %v", res.StatusCode)
	}

	resBody, err := ioutil.ReadAll(res.Body)
	if err != nil {
		return nil, fmt.Errorf("Couldn't read response body: %v", err)
	}

	// Extract data from JSON
	torrents := gjson.GetBytes(resBody, "torrent_results").Array()
	if len(torrents) == 0 {
		// Nil slice is ok, because it can be checked with len()
		return nil, nil
	}
	var results []Result
	for _, torrent := range torrents {
		// Note: When using `format=json` or no format in the query, use "filename" here,
		// otherwise (`format=json_extended`) use "title" here.
		filename := torrent.Get("title").String()

		// Torrents without one of the known quality markers in their name are skipped.
		var quality string
		switch {
		case strings.Contains(filename, "720p"):
			quality = "720p"
		case strings.Contains(filename, "1080p"):
			quality = "1080p"
		case strings.Contains(filename, "2160p"):
			quality = "2160p"
		default:
			continue
		}

		magnet := torrent.Get("download").String()
		// look for "btih:dd8255ecdc7ca55fb0bbf81323d87062db1f6d1c&" via regex and then cut out the hash
		match := magnet2InfoHashRegex.Find([]byte(magnet))
		infoHash := strings.TrimPrefix(string(match), "btih:")
		infoHash = strings.TrimSuffix(infoHash, "&")
		infoHash = strings.ToLower(infoHash)
		if len(infoHash) != 40 {
			c.logger.Error("InfoHash isn't 40 characters long", zap.String("magnet", magnet), zapFieldID, zapFieldTorrentSite)
			continue
		}

		size := int(torrent.Get("size").Int())
		seeders := int(torrent.Get("seeders").Int())
		if c.logFoundTorrents {
			c.logger.Debug("Found torrent", zap.String("quality", quality), zap.String("infoHash", infoHash), zap.String("magnet", magnet), zap.Int("size", size), zap.Int("seeders", seeders), zapFieldID, zapFieldTorrentSite)
		}
		result := Result{
			Name: filename,
			// We don't know the title, but it will be overwritten by the quality anyway
			// Title: "",
			Quality:   quality,
			InfoHash:  infoHash,
			MagnetURL: magnet,
			Size:      size,
			Seeders:   seeders,
		}
		results = append(results, result)
	}

	// Fill cache, even if there are no results, because that's just the current state of the torrent site.
	// Any actual errors would have returned earlier.
	if err := c.cache.Set(cacheKey, results); err != nil {
		c.logger.Error("Couldn't cache torrents", zap.Error(err), zap.String("cache", "torrent"), zapFieldID, zapFieldTorrentSite)
	}

	return results, nil
}
// IsSlow always returns true for the RARBG client.
// NOTE(review): presumably because requests are serialized and spaced 2 seconds apart; confirm how callers use this flag.
func (c *rarbgClient) IsSlow() bool {
return true
}
// RefreshToken fetches a new API token from RARBG and stores it in the client.
//
// It holds the client's lock for the whole operation. If the token turns out to be
// still valid once the lock is acquired (another goroutine refreshed it in the meantime),
// it returns nil without waiting and without sending a request.
// Otherwise it waits until 2 seconds have passed since the last API request, fetches the
// token and marks it as expired once it's older than 14 minutes.
//
// An error is returned if the request can't be created or sent, the response status
// isn't 200, the body can't be read or the response contains no token.
func (c *rarbgClient) RefreshToken() error {
	url := c.baseURL + "/pubapi_v2.php?app_id=deflix&get_token=get_token"
	req, err := http.NewRequest("GET", url, nil)
	if err != nil {
		return fmt.Errorf("Couldn't create request object: %v", err)
	}

	// Prevent concurrent requests
	c.lock.Lock()
	defer c.lock.Unlock()

	// After getting the lock, check expiry again (was already checked before RefreshToken() was called) to not send this request several times due to concurrent incoming requests after the token expired.
	// This is done before the rate limit wait, so callers that don't need a refresh aren't delayed.
	if !c.tokenExpired() {
		return nil
	}

	// Wait for 2 seconds to pass if necessary, so we don't hit the rate limit
	time.Sleep(2*time.Second - time.Since(c.lastRequest))
	// Deferred calls run in reverse order, so this runs *before* the unlock above.
	// The timestamp must be written while the lock is still held: otherwise the next goroutine
	// could read a stale lastRequest and send its request too early.
	defer func() {
		c.lastRequest = time.Now()
	}()

	res, err := c.httpClient.Do(req)
	if err != nil {
		return fmt.Errorf("Couldn't GET %v: %v", url, err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		return fmt.Errorf("Bad GET response: %v", res.StatusCode)
	}

	resBody, err := ioutil.ReadAll(res.Body)
	if err != nil {
		return fmt.Errorf("Couldn't read response body: %v", err)
	}
	token := gjson.GetBytes(resBody, "token").String()
	if token == "" {
		return fmt.Errorf("Token is empty")
	}
	c.token = token

	// The closure captures the creation time of this specific token.
	createdAt := time.Now()
	c.tokenExpired = func() bool {
		return time.Since(createdAt).Minutes() > 14
	}

	return nil
}