httpz- Hyper-fast HTTP Scraping Tool |
git clone git://git.acid.vegas/httpz.git |
Log | Files | Refs | Archive | README | LICENSE |
cli.py (7109B)
1 #!/usr/bin/env python3 2 # HTTPZ Web Scanner - Developed by acidvegas in Python (https://github.com/acidvegas/httpz) 3 # httpz/cli.py 4 5 import argparse 6 import asyncio 7 import logging 8 import os 9 import sys 10 11 from .colors import Colors 12 from .scanner import HTTPZScanner 13 from .utils import SILENT_MODE, info 14 15 def setup_logging(level='INFO', log_to_disk=False): 16 ''' 17 Setup logging configuration 18 19 :param level: Logging level (INFO or DEBUG) 20 :param log_to_disk: Whether to also log to file 21 ''' 22 class ColoredFormatter(logging.Formatter): 23 def formatTime(self, record, datefmt=None): 24 # Format: MM-DD HH:MM 25 from datetime import datetime 26 dt = datetime.fromtimestamp(record.created) 27 return f"{Colors.GRAY}{dt.strftime('%m-%d %H:%M')}{Colors.RESET}" 28 29 def format(self, record): 30 return f'{self.formatTime(record)} {record.getMessage()}' 31 32 handlers = [] 33 34 # Console handler 35 console = logging.StreamHandler() 36 console.setFormatter(ColoredFormatter()) 37 handlers.append(console) 38 39 # File handler 40 if log_to_disk: 41 os.makedirs('logs', exist_ok=True) 42 file_handler = logging.FileHandler(f'logs/httpz.log') 43 file_handler.setFormatter(logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')) 44 handlers.append(file_handler) 45 46 # Setup logger 47 logging.basicConfig( 48 level=getattr(logging, level.upper()), 49 handlers=handlers 50 ) 51 52 def parse_status_codes(codes_str: str) -> set: 53 ''' 54 Parse comma-separated status codes and ranges into a set of integers 55 56 :param codes_str: Comma-separated status codes (e.g., "200,301-399,404,500-503") 57 ''' 58 59 codes = set() 60 try: 61 for part in codes_str.split(','): 62 if '-' in part: 63 start, end = map(int, part.split('-')) 64 codes.update(range(start, end + 1)) 65 else: 66 codes.add(int(part)) 67 return codes 68 except ValueError: 69 raise argparse.ArgumentTypeError('Invalid status code format. Use comma-separated numbers or ranges (e.g., 200,301-399,404,500-503)') 70 71 async def main(): 72 parser = argparse.ArgumentParser( 73 description=f'{Colors.GREEN}Hyper-fast HTTP Scraping Tool{Colors.RESET}', 74 formatter_class=argparse.RawDescriptionHelpFormatter 75 ) 76 77 # Add arguments 78 parser.add_argument('file', nargs='?', default='-', help='File containing domains to check (one per line), use - for stdin') 79 parser.add_argument('-all', '--all-flags', action='store_true', help='Enable all output flags') 80 parser.add_argument('-d', '--debug', action='store_true', help='Show error states and debug information') 81 parser.add_argument('-c', '--concurrent', type=int, default=100, help='Number of concurrent checks') 82 parser.add_argument('-j', '--jsonl', action='store_true', help='Output JSON Lines format to console') 83 parser.add_argument('-o', '--output', help='Output file path (JSONL format)') 84 85 # Output field flags 86 parser.add_argument('-b', '--body', action='store_true', help='Show body preview') 87 parser.add_argument('-cn', '--cname', action='store_true', help='Show CNAME records') 88 parser.add_argument('-cl', '--content-length', action='store_true', help='Show content length') 89 parser.add_argument('-ct', '--content-type', action='store_true', help='Show content type') 90 parser.add_argument('-f', '--favicon', action='store_true', help='Show favicon hash') 91 parser.add_argument('-fr', '--follow-redirects', action='store_true', help='Follow redirects (max 10)') 92 parser.add_argument('-hr', '--headers', action='store_true', help='Show response headers') 93 parser.add_argument('-i', '--ip', action='store_true', help='Show IP addresses') 94 parser.add_argument('-sc', '--status-code', action='store_true', help='Show status code') 95 parser.add_argument('-ti', '--title', action='store_true', help='Show page title') 96 parser.add_argument('-tls', '--tls-info', action='store_true', help='Show TLS certificate information') 97 98 # Other arguments 99 parser.add_argument('-ax', '--axfr', action='store_true', help='Try AXFR transfer against nameservers') 100 parser.add_argument('-ec', '--exclude-codes', type=parse_status_codes, help='Exclude these status codes (comma-separated, e.g., 404,500)') 101 parser.add_argument('-mc', '--match-codes', type=parse_status_codes, help='Only show these status codes (comma-separated, e.g., 200,301,404)') 102 parser.add_argument('-p', '--progress', action='store_true', help='Show progress counter') 103 parser.add_argument('-r', '--resolvers', help='File containing DNS resolvers (one per line)') 104 parser.add_argument('-to', '--timeout', type=int, default=5, help='Request timeout in seconds') 105 106 args = parser.parse_args() 107 108 # Setup logging based on arguments 109 global SILENT_MODE 110 SILENT_MODE = args.jsonl 111 112 if not SILENT_MODE: 113 if args.debug: 114 setup_logging(level='DEBUG', log_to_disk=True) 115 else: 116 setup_logging(level='INFO') 117 118 if args.file == '-': 119 info('Reading domains from stdin') 120 else: 121 info(f'Processing file: {args.file}') 122 123 # Setup show_fields 124 show_fields = { 125 'status_code' : args.all_flags or args.status_code, 126 'content_type' : args.all_flags or args.content_type, 127 'content_length' : args.all_flags or args.content_length, 128 'title' : args.all_flags or args.title, 129 'body' : args.all_flags or args.body, 130 'ip' : args.all_flags or args.ip, 131 'favicon' : args.all_flags or args.favicon, 132 'headers' : args.all_flags or args.headers, 133 'follow_redirects' : args.all_flags or args.follow_redirects, 134 'cname' : args.all_flags or args.cname, 135 'tls' : args.all_flags or args.tls_info 136 } 137 138 # If no fields specified show all 139 if not any(show_fields.values()): 140 show_fields = {k: True for k in show_fields} 141 142 try: 143 # Create scanner instance 144 scanner = HTTPZScanner( 145 concurrent_limit=args.concurrent, 146 timeout=args.timeout, 147 follow_redirects=args.all_flags or args.follow_redirects, 148 check_axfr=args.axfr, 149 resolver_file=args.resolvers, 150 output_file=args.output, 151 show_progress=args.progress, 152 debug_mode=args.debug, 153 jsonl_output=args.jsonl, 154 show_fields=show_fields, 155 match_codes=args.match_codes, 156 exclude_codes=args.exclude_codes 157 ) 158 159 # Run the scanner with file/stdin input 160 await scanner.scan(args.file) 161 162 except KeyboardInterrupt: 163 logging.warning('Process interrupted by user') 164 sys.exit(1) 165 except Exception as e: 166 logging.error(f'Unexpected error: {str(e)}') 167 sys.exit(1) 168 169 def run(): 170 '''Entry point for the CLI''' 171 asyncio.run(main()) 172 173 if __name__ == '__main__': 174 run()