parent
							
								
									5880487d27
								
							
						
					
					
						commit
						0e9845b69a
					
				|  | @ -106,7 +106,7 @@ grep -Fx -f "top-1m-well-known.txt" > "phishing-top-domains.txt" | |||
| 
 | ||||
| ## Exclude popular domains | ||||
| cat "phishing-domains.txt" | \ | ||||
| grep -F -vf "phishing-top-domains.txt" > "phishing-notop-domains.txt" | ||||
| grep -F -vf "phishing-top-domains.txt" > "phishing-notop-domains-temp.txt" | ||||
| 
 | ||||
| cat "phishing.txt" | \ | ||||
| grep -F -f "phishing-top-domains.txt" > "phishing-url-top-domains-temp.txt" | ||||
|  | @ -122,7 +122,8 @@ while read URL; do | |||
| 
 | ||||
|   ## Separate host-only URL | ||||
|   if [ -z "$URI" ] || [ "$URI" = "/" ]; then | ||||
|     echo "$HOST" >> "phishing-notop-domains.txt" | ||||
|     echo "$HOST" | \ | ||||
|     cut -f 1 -d ":" >> "phishing-notop-domains-temp.txt" | ||||
|   else | ||||
|     ## Parse phishing URLs from popular domains | ||||
|     echo "$URL" | \ | ||||
|  | @ -134,6 +135,9 @@ done < "phishing-url-top-domains-temp.txt" | |||
| ## Re-enable command print | ||||
| set -x | ||||
| 
 | ||||
| ## "phishing-url-top-domains-temp.txt" may add duplicate entries | ||||
| sort -u "phishing-notop-domains-temp.txt" > "phishing-notop-domains.txt" | ||||
| 
 | ||||
| 
 | ||||
| ## Merge malware domains and URLs | ||||
| CURRENT_TIME="$(date -R -u)" | ||||
|  |  | |||
		Loading…
	
		Reference in New Issue