Highly-opinionated (ex-bullshit-free) MTPROTO proxy for Telegram. If you use v1.0 or upgrade broke you proxy, please read the chapter Version 2
您最多选择25个主题 主题必须以字母或数字开头,可以包含连字符 (-),并且长度不得超过35个字符

firehol.go 6.9KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343
  1. package ipblocklist
  2. import (
  3. "bufio"
  4. "context"
  5. "fmt"
  6. "io"
  7. "io/ioutil"
  8. "net"
  9. "net/http"
  10. "net/url"
  11. "os"
  12. "regexp"
  13. "strings"
  14. "sync"
  15. "time"
  16. "github.com/9seconds/mtg/v2/mtglib"
  17. "github.com/kentik/patricia"
  18. "github.com/kentik/patricia/bool_tree"
  19. "github.com/panjf2000/ants/v2"
  20. )
  21. const (
  22. fireholIPv4DefaultCIDR = 32
  23. fireholIPv6DefaultCIDR = 128
  24. )
  25. var fireholRegexpComment = regexp.MustCompile(`\s*#.*?$`)
  26. type Firehol struct {
  27. ctx context.Context
  28. ctxCancel context.CancelFunc
  29. logger mtglib.Logger
  30. rwMutex sync.RWMutex
  31. remoteURLs []string
  32. localFiles []string
  33. httpClient *http.Client
  34. workerPool *ants.Pool
  35. treeV4 *bool_tree.TreeV4
  36. treeV6 *bool_tree.TreeV6
  37. }
  38. func (f *Firehol) Contains(ip net.IP) bool {
  39. if ip == nil {
  40. return true
  41. }
  42. ip4 := ip.To4()
  43. f.rwMutex.RLock()
  44. defer f.rwMutex.RUnlock()
  45. if ip4 != nil {
  46. return f.containsIPv4(ip4)
  47. }
  48. return f.containsIPv6(ip.To16())
  49. }
  50. func (f *Firehol) containsIPv4(addr net.IP) bool {
  51. ip := patricia.NewIPv4AddressFromBytes(addr, 32)
  52. if ok, _, err := f.treeV4.FindDeepestTag(ip); ok && err == nil {
  53. return true
  54. }
  55. return false
  56. }
  57. func (f *Firehol) containsIPv6(addr net.IP) bool {
  58. ip := patricia.NewIPv6Address(addr, 128)
  59. if ok, _, err := f.treeV6.FindDeepestTag(ip); ok && err == nil {
  60. return true
  61. }
  62. return false
  63. }
  64. func (f *Firehol) Run(updateEach time.Duration) {
  65. ticker := time.NewTicker(updateEach)
  66. defer func() {
  67. ticker.Stop()
  68. select {
  69. case <-ticker.C:
  70. default:
  71. }
  72. }()
  73. if err := f.update(); err != nil {
  74. f.logger.WarningError("cannot update blocklist", err)
  75. }
  76. for {
  77. select {
  78. case <-f.ctx.Done():
  79. return
  80. case <-ticker.C:
  81. if err := f.update(); err != nil {
  82. f.logger.WarningError("cannot update blocklist", err)
  83. }
  84. }
  85. }
  86. }
  87. func (f *Firehol) Shutdown() {
  88. f.ctxCancel()
  89. }
  90. func (f *Firehol) update() error { // nolint: funlen, cyclop
  91. ctx, cancel := context.WithCancel(f.ctx)
  92. defer cancel()
  93. wg := &sync.WaitGroup{}
  94. wg.Add(len(f.remoteURLs) + len(f.localFiles))
  95. treeMutex := &sync.Mutex{}
  96. v4tree := bool_tree.NewTreeV4()
  97. v6tree := bool_tree.NewTreeV6()
  98. errorChan := make(chan error, 1)
  99. defer close(errorChan)
  100. for _, v := range f.localFiles {
  101. go func(filename string) {
  102. defer wg.Done()
  103. if err := f.updateLocalFile(ctx, filename, treeMutex, v4tree, v6tree); err != nil {
  104. cancel()
  105. f.logger.BindStr("filename", filename).WarningError("cannot update", err)
  106. select {
  107. case errorChan <- err:
  108. default:
  109. }
  110. }
  111. }(v)
  112. }
  113. for _, v := range f.remoteURLs {
  114. value := v
  115. f.workerPool.Submit(func() { // nolint: errcheck
  116. defer wg.Done()
  117. if err := f.updateRemoteURL(ctx, value, treeMutex, v4tree, v6tree); err != nil {
  118. cancel()
  119. f.logger.BindStr("url", value).WarningError("cannot update", err)
  120. select {
  121. case errorChan <- err:
  122. default:
  123. }
  124. }
  125. })
  126. }
  127. wg.Wait()
  128. select {
  129. case err := <-errorChan:
  130. return fmt.Errorf("cannot update trees: %w", err)
  131. default:
  132. }
  133. f.rwMutex.Lock()
  134. defer f.rwMutex.Unlock()
  135. f.treeV4 = v4tree
  136. f.treeV6 = v6tree
  137. return nil
  138. }
  139. func (f *Firehol) updateLocalFile(ctx context.Context, filename string,
  140. mutex sync.Locker,
  141. v4tree *bool_tree.TreeV4, v6tree *bool_tree.TreeV6) error {
  142. filefp, err := os.Open(filename)
  143. if err != nil {
  144. return fmt.Errorf("cannot open file: %w", err)
  145. }
  146. go func(ctx context.Context, closer io.Closer) {
  147. <-ctx.Done()
  148. closer.Close()
  149. }(ctx, filefp)
  150. defer filefp.Close()
  151. return f.updateTrees(mutex, filefp, v4tree, v6tree)
  152. }
  153. func (f *Firehol) updateRemoteURL(ctx context.Context, url string,
  154. mutex sync.Locker,
  155. v4tree *bool_tree.TreeV4, v6tree *bool_tree.TreeV6) error {
  156. req, err := http.NewRequestWithContext(ctx, http.MethodGet, url, nil)
  157. if err != nil {
  158. return fmt.Errorf("cannot build a request: %w", err)
  159. }
  160. resp, err := f.httpClient.Do(req) // nolint: bodyclose
  161. if err != nil {
  162. return fmt.Errorf("cannot request a remote URL %s: %w", url, err)
  163. }
  164. go func(ctx context.Context, closer io.Closer) {
  165. <-ctx.Done()
  166. closer.Close()
  167. }(ctx, resp.Body)
  168. defer func(rc io.ReadCloser) {
  169. io.Copy(ioutil.Discard, rc) // nolint: errcheck
  170. rc.Close()
  171. }(resp.Body)
  172. return f.updateTrees(mutex, resp.Body, v4tree, v6tree)
  173. }
  174. func (f *Firehol) updateTrees(mutex sync.Locker,
  175. reader io.Reader,
  176. v4tree *bool_tree.TreeV4,
  177. v6tree *bool_tree.TreeV6) error {
  178. scanner := bufio.NewScanner(reader)
  179. for scanner.Scan() {
  180. text := scanner.Text()
  181. text = fireholRegexpComment.ReplaceAllLiteralString(text, "")
  182. text = strings.TrimSpace(text)
  183. if text == "" {
  184. continue
  185. }
  186. ip, cidr, err := f.updateParseLine(text)
  187. if err != nil {
  188. return fmt.Errorf("cannot parse a line: %w", err)
  189. }
  190. if err := f.updateAddToTrees(ip, cidr, mutex, v4tree, v6tree); err != nil {
  191. return fmt.Errorf("cannot add a node to the tree: %w", err)
  192. }
  193. }
  194. if scanner.Err() != nil {
  195. return fmt.Errorf("cannot parse a response: %w", scanner.Err())
  196. }
  197. return nil
  198. }
  199. func (f *Firehol) updateParseLine(text string) (net.IP, uint, error) {
  200. _, ipnet, err := net.ParseCIDR(text)
  201. if err != nil {
  202. ipaddr := net.ParseIP(text)
  203. if ipaddr == nil {
  204. return nil, 0, fmt.Errorf("incorrect ip address %s", text)
  205. }
  206. ip4 := ipaddr.To4()
  207. if ip4 != nil {
  208. return ip4, fireholIPv4DefaultCIDR, nil
  209. }
  210. return ipaddr.To16(), fireholIPv6DefaultCIDR, nil
  211. }
  212. ones, _ := ipnet.Mask.Size()
  213. return ipnet.IP, uint(ones), nil
  214. }
  215. func (f *Firehol) updateAddToTrees(ip net.IP, cidr uint,
  216. mutex sync.Locker,
  217. v4tree *bool_tree.TreeV4, v6tree *bool_tree.TreeV6) error {
  218. mutex.Lock()
  219. defer mutex.Unlock()
  220. if ip.To4() != nil {
  221. addr := patricia.NewIPv4AddressFromBytes(ip, cidr)
  222. if _, _, err := v4tree.Set(addr, true); err != nil {
  223. return err // nolint: wrapcheck
  224. }
  225. } else {
  226. addr := patricia.NewIPv6Address(ip, cidr)
  227. if _, _, err := v6tree.Set(addr, true); err != nil {
  228. return err // nolint: wrapcheck
  229. }
  230. }
  231. return nil
  232. }
  233. func NewFirehol(logger mtglib.Logger, network mtglib.Network,
  234. downloadConcurrency uint,
  235. remoteURLs []string,
  236. localFiles []string) (*Firehol, error) {
  237. for _, v := range remoteURLs {
  238. parsed, err := url.Parse(v)
  239. if err != nil {
  240. return nil, fmt.Errorf("incorrect url %s: %w", v, err)
  241. }
  242. switch parsed.Scheme {
  243. case "http", "https":
  244. default:
  245. return nil, fmt.Errorf("unsupported url %s", v)
  246. }
  247. }
  248. for _, v := range localFiles {
  249. if stat, err := os.Stat(v); os.IsNotExist(err) || stat.IsDir() || stat.Mode().Perm()&0o400 == 0 {
  250. return nil, fmt.Errorf("%s is not a readable file", v)
  251. }
  252. }
  253. if downloadConcurrency == 0 {
  254. downloadConcurrency = 1
  255. }
  256. workerPool, _ := ants.NewPool(int(downloadConcurrency))
  257. ctx, cancel := context.WithCancel(context.Background())
  258. return &Firehol{
  259. ctx: ctx,
  260. ctxCancel: cancel,
  261. logger: logger.Named("firehol"),
  262. httpClient: network.MakeHTTPClient(nil),
  263. treeV4: bool_tree.NewTreeV4(),
  264. treeV6: bool_tree.NewTreeV6(),
  265. workerPool: workerPool,
  266. remoteURLs: remoteURLs,
  267. localFiles: localFiles,
  268. }, nil
  269. }