null, '*.mgr.consensu.org' => null, 'vs*.gzcu.u3.ucweb.com' => null, 'ad*.goforandroid.com' => null, 'bs*.9669.cn' => null, '*dnserror*.wo.com.cn' => null, '*mistat*.xiaomi.com' => null, 'affrh20*.com' => null, 'assoc-amazon.*' => null, 'clkservice*.youdao.com' => null, 'dsp*.youdao.com' => null, 'pussl*.com' => null, 'putrr*.com' => null, 'ad.*.360.cn' => null, 't*.a.market.xiaomi.com' => null, 'ad*.bigmir.net' => null, 'log*.molitv.cn' => null, 'adm*.autoimg.cn' => null, 'cloudservice*.kingsoft-office-service.com' => null, 'gg*.51cto.com' => null, 'log.*.hunantv.com' => null, '*.log.hunantv.com' => null, 'iflyad.*.openstorage.cn' => null, '*customstat*.51togic.com' => null, 'appcloud*.zhihu.com' => null, 'ad*.molitv.cn' => null, 'ads*-adnow.com' => null, 'aeros*.tk' => null, 'analyzer*.fc2.com' => null, 'admicro*.vcmedia.vn' => null, 'xn--xhq9mt12cf5v.*' => null, 'freecontent.*' => null, 'hostingcloud.*' => null, 'jshosting.*' => null, 'flightzy.*' => null, 'sunnimiq*.cf' => null, 'admob.*' => null, '*log.droid4x.cn' => null, '*tsdk.vivo.com.cn' => null, '*.mmstat.com' => null, 'sf*-ttcdn-tos.pstatp.com' => null, ); $ARR_REGEX_LIST = array( '/9377[a-z]{2}\.com$/' => null, '/^(\S+\.)?ad([\d]|m|s)?\./' => null, '/^(\S+\.)?affiliat(es|ion|e)\./' => null, '/afgr[\d]{1,2}\.com$/' => null, '/^(\S+\.)?analytics(\-|\.)/' => null, '/^(\S+\.)?counter(\-|\.)/' => null, '/^(\S+\.)?pixels?\./' => null, '/syma[a-z]\.cn$/' => null, '/^(\S+\.)?widgets?\./' => null, '/^(\S+\.)?(web)?stats?\./' => null, '/^(\S+\.)?track(ing)?\./' => null, '/^(\S+\.)?tongji\./' => null, '/^(\S+\.)?toolbar\./' => null, '/^(\S+\.)?adservice\.google\./' => null, '/^(\S+\.)?d[\d]+\.sina(img)?(\.com)?\.cn/' => null, '/^(\S+\.)?sax[\dns]?\.sina\.com\.cn/' => null, '/delivery([\d]{2}|dom|modo).com$/' => null, '/^(\S+\.)?[c-s]ads(abs|abz|ans|anz|ats|atz|del|ecs|ecz|ims|imz|ips|ipz|kis|kiz|oks|okz|one|pms|pmz)\.com/' => null, '/^([a-z\d\-]+\.)?(?!xn--)[^\.\/]{40,}\.(com|net|cn)(\.cn)?$/' => null, //超长域名 '/^(\S+\.)?11599[\da-z]{2,20}\.com$/' => null, //"澳门新葡京"系列 '/^(\S+\.)?61677[\da-z]{0,20}\.com$/' => null, //"澳门新葡京"系列 // '/^(\S+\.)?(?=.*[a-f].*\.com$)(?=.*\d.*\.com$)[a-f0-9]{15,}\.com$/' => null, ); //对通配符匹配或正则匹配增加的额外赦免规则 $ARR_WHITE_RULE_LIST = array( '@@||tongji.*kuwo.cn^' => 0, // '@@||ntp.org^' => 1, //强制加白,针对上面正则表达式的一个赦免规则,例如:2.android.pool.ntp.org // '@@||*push-apple.com.akadns.net^' => 1, //强制加白, 苹果推送2.courier-push-apple.com.akadns.net '@@||tracking.epicgames.com^' => 0, '@@||tracker.eu.org^' => 1, //强制加白,BT tracker,有形如2.tracker.eu.org的域 '@@||stats.uptimerobot.com^' => 0, //uptimerobot监测相关 '@@||track.sendcloud.org^' => 0, //邮件退订域名 '@@||log.mmstat.com^' => 0, //修复优酷视频显示禁用了cookie '@@||adm.10jqka.com.cn^' => 0, //同花顺 '@@||center-h5api.m.taobao.com^' => 1, //h5页面 '@@||app.adjust.com^' => 1, //https://github.com/AdguardTeam/AdGuardSDNSFilter/pull/186 ); //针对上游赦免规则anti-AD不予赦免的规则,即赦免名单的黑名单 $ARR_WHITE_RULE_BLK_LIST = array( '@@||ads.nipr.ac.jp^' => null, ); //针对上游通配符规则中anti-AD不予采信的规则,即通配符黑名单 $ARR_WILD_BLK_LIST = array( 'cnt*rambler.ru' => null, 'um*.com' => null, ); if(PHP_SAPI != 'cli'){ die('nothing.'); } $src_file = ''; try{ $file = $argv[1]; $src_file = ROOT_DIR . $file; }catch(Exception $e){ echo "get args failed.", $e->getMessage(), "\n"; die(0); } if(empty($src_file) || !is_file($src_file)){ echo 'src_file:', $src_file, ' is not found.'; die(0); } if(!is_file(WILDCARD_SRC) || !is_file(WHITERULE_SRC)){ echo 'key file is not found.'; die(0); } $src_fp = fopen($src_file, 'r'); $wild_fp = fopen(WILDCARD_SRC, 'r'); $new_fp = fopen($src_file . '.txt', 'w'); $wrote_wild = array(); $arr_wild_src = array(); while(!feof($wild_fp)){ $wild_row = fgets($wild_fp, 512); if(empty($wild_row)){ continue; } if(!preg_match('/^\|\|?([\w\-\.\*]+?)\^(\$([^=]+?,)?(image|third-party|script)(,[^=]+)?)?$/', $wild_row, $matches)){ continue; } if(array_key_exists($matches[1], $ARR_WILD_BLK_LIST)){ continue; } $matched = false; foreach($ARR_REGEX_LIST as $regex_str => $regex_row){ if(preg_match($regex_str, str_replace('*', '',$matches[1]))){ $matched = true; } } if($matched){ continue; } $arr_wild_src[$matches[1]] = $wild_row; } fclose($wild_fp); $arr_wild_src = array_merge($arr_wild_src, $ARR_MERGED_WILD_LIST); $insert_pos = $written_size = $line_count = 0; while(!feof($src_fp)){ $row = fgets($src_fp, 512); if(empty($row)){ continue; } if(($row{0} === '!') && (substr($row, 0, 13) === '!TOTAL_LINES=')){ $insert_pos = $written_size; } if(!preg_match('/^\|.+?/', $row)){ $written_size += fwrite($new_fp, $row); continue; } $matched = false; foreach($ARR_REGEX_LIST as $regex_str => $regex_row){ if(preg_match($regex_str, substr(trim($row), 2, -1))){ $matched = true; if(!array_key_exists($regex_str, $wrote_wild)){ $written_size += fwrite($new_fp, "${regex_str}\n"); $line_count++; $wrote_wild[$regex_str] = 1; } } } if($matched){ continue; } foreach($arr_wild_src as $core_str => $wild_row){ $match_rule = str_replace('*', '.*', $core_str); if(!array_key_exists($core_str, $wrote_wild)){ $written_size += fwrite($new_fp, "||${core_str}^\n"); $line_count++; $wrote_wild[$core_str] = 1; } if(preg_match("/\|${match_rule}/", $row)){ $matched = true; break; } } if($matched){ continue; } $written_size += fwrite($new_fp, $row); $line_count++; } //按需写入白名单规则 $wrote_whitelist = array(); $whiterule = file(WHITERULE_SRC, FILE_SKIP_EMPTY_LINES | FILE_IGNORE_NEW_LINES); $whiterule=array_fill_keys($whiterule, 0); $ARR_WHITE_RULE_LIST = array_merge($whiterule, $ARR_WHITE_RULE_LIST); foreach($ARR_WHITE_RULE_LIST as $row => $v){ if(empty($row) || $row{0} !== '@' || $row{1} !== '@'){ continue; } $matches = array(); if(!preg_match('/@@\|\|([0-9a-z\.\-\*]+?)\^/', $row, $matches)){ continue; } if(array_key_exists("@@||${matches[1]}^", $ARR_WHITE_RULE_BLK_LIST)){ continue; } if($v === 1){ $wrote_whitelist[$matches[1]] = null; fwrite($new_fp, "@@||${matches[1]}^\n"); $line_count++; continue; } foreach($wrote_wild as $core_str => $val){ if($core_str{0} === '/'){ $match_rule = $core_str; }else{ $match_rule = str_replace('*', '.*', $core_str); $match_rule = "/${match_rule}/"; } if(preg_match($match_rule, $matches[1])){ $domain = addressMaker::extract_main_domain($matches[1]); if(array_key_exists($domain, $black_domain_list) || (is_array($black_domain_list[$domain]) && in_array($matches[1], $black_domain_list[$domain])) ){ continue; } if(array_key_exists($matches[1], $wrote_whitelist)){ continue; } $wrote_whitelist[$matches[1]] = null; fwrite($new_fp, "@@||${matches[1]}^\n"); $line_count++; } } } if(($insert_pos > 0) && (fseek($new_fp, $insert_pos) === 0)){ fwrite($new_fp, "!TOTAL_LINES={$line_count}\n"); } fclose($src_fp); fclose($new_fp); rename($src_file . '.txt', $src_file); echo 'Time cost:', microtime(true) - START_TIME, "s, at ", date('m-d H:i:s'), "\n";