httpz

- Hyper-fast HTTP Scraping Tool
git clone git://git.acid.vegas/httpz.git
Log | Files | Refs | Archive | README | LICENSE

cli.py (7109B)

      1 #!/usr/bin/env python3
      2 # HTTPZ Web Scanner - Developed by acidvegas in Python (https://github.com/acidvegas/httpz)
      3 # httpz/cli.py
      4 
      5 import argparse
      6 import asyncio
      7 import logging
      8 import os
      9 import sys
     10 
     11 from .colors  import Colors
     12 from .scanner import HTTPZScanner
     13 from .utils   import SILENT_MODE, info
     14 
     15 def setup_logging(level='INFO', log_to_disk=False):
     16     '''
     17     Setup logging configuration
     18     
     19     :param level: Logging level (INFO or DEBUG)
     20     :param log_to_disk: Whether to also log to file
     21     '''
     22     class ColoredFormatter(logging.Formatter):
     23         def formatTime(self, record, datefmt=None):
     24             # Format: MM-DD HH:MM
     25             from datetime import datetime
     26             dt = datetime.fromtimestamp(record.created)
     27             return f"{Colors.GRAY}{dt.strftime('%m-%d %H:%M')}{Colors.RESET}"
     28         
     29         def format(self, record):
     30             return f'{self.formatTime(record)} {record.getMessage()}'
     31     
     32     handlers = []
     33     
     34     # Console handler
     35     console = logging.StreamHandler()
     36     console.setFormatter(ColoredFormatter())
     37     handlers.append(console)
     38     
     39     # File handler
     40     if log_to_disk:
     41         os.makedirs('logs', exist_ok=True)
     42         file_handler = logging.FileHandler(f'logs/httpz.log')
     43         file_handler.setFormatter(logging.Formatter('%(asctime)s - %(levelname)s - %(message)s'))
     44         handlers.append(file_handler)
     45     
     46     # Setup logger
     47     logging.basicConfig(
     48         level=getattr(logging, level.upper()),
     49         handlers=handlers
     50     )
     51 
     52 def parse_status_codes(codes_str: str) -> set:
     53     '''
     54     Parse comma-separated status codes and ranges into a set of integers
     55     
     56     :param codes_str: Comma-separated status codes (e.g., "200,301-399,404,500-503")
     57     '''
     58     
     59     codes = set()
     60     try:
     61         for part in codes_str.split(','):
     62             if '-' in part:
     63                 start, end = map(int, part.split('-'))
     64                 codes.update(range(start, end + 1))
     65             else:
     66                 codes.add(int(part))
     67         return codes
     68     except ValueError:
     69         raise argparse.ArgumentTypeError('Invalid status code format. Use comma-separated numbers or ranges (e.g., 200,301-399,404,500-503)')
     70 
     71 async def main():
     72     parser = argparse.ArgumentParser(
     73         description=f'{Colors.GREEN}Hyper-fast HTTP Scraping Tool{Colors.RESET}',
     74         formatter_class=argparse.RawDescriptionHelpFormatter
     75     )
     76 
     77     # Add arguments
     78     parser.add_argument('file', nargs='?', default='-', help='File containing domains to check (one per line), use - for stdin')
     79     parser.add_argument('-all', '--all-flags', action='store_true', help='Enable all output flags')
     80     parser.add_argument('-d', '--debug', action='store_true', help='Show error states and debug information')
     81     parser.add_argument('-c', '--concurrent', type=int, default=100, help='Number of concurrent checks')
     82     parser.add_argument('-j', '--jsonl', action='store_true', help='Output JSON Lines format to console')
     83     parser.add_argument('-o', '--output', help='Output file path (JSONL format)')
     84     
     85     # Output field flags
     86     parser.add_argument('-b', '--body', action='store_true', help='Show body preview')
     87     parser.add_argument('-cn', '--cname', action='store_true', help='Show CNAME records')
     88     parser.add_argument('-cl', '--content-length', action='store_true', help='Show content length')
     89     parser.add_argument('-ct', '--content-type', action='store_true', help='Show content type')
     90     parser.add_argument('-f', '--favicon', action='store_true', help='Show favicon hash')
     91     parser.add_argument('-fr', '--follow-redirects', action='store_true', help='Follow redirects (max 10)')
     92     parser.add_argument('-hr', '--headers', action='store_true', help='Show response headers')
     93     parser.add_argument('-i', '--ip', action='store_true', help='Show IP addresses')
     94     parser.add_argument('-sc', '--status-code', action='store_true', help='Show status code')
     95     parser.add_argument('-ti', '--title', action='store_true', help='Show page title')
     96     parser.add_argument('-tls', '--tls-info', action='store_true', help='Show TLS certificate information')
     97     
     98     # Other arguments
     99     parser.add_argument('-ax', '--axfr', action='store_true', help='Try AXFR transfer against nameservers')
    100     parser.add_argument('-ec', '--exclude-codes', type=parse_status_codes, help='Exclude these status codes (comma-separated, e.g., 404,500)')
    101     parser.add_argument('-mc', '--match-codes', type=parse_status_codes, help='Only show these status codes (comma-separated, e.g., 200,301,404)')
    102     parser.add_argument('-p', '--progress', action='store_true', help='Show progress counter')
    103     parser.add_argument('-r', '--resolvers', help='File containing DNS resolvers (one per line)')
    104     parser.add_argument('-to', '--timeout', type=int, default=5, help='Request timeout in seconds')
    105     
    106     args = parser.parse_args()
    107 
    108     # Setup logging based on arguments
    109     global SILENT_MODE
    110     SILENT_MODE = args.jsonl
    111 
    112     if not SILENT_MODE:
    113         if args.debug:
    114             setup_logging(level='DEBUG', log_to_disk=True)
    115         else:
    116             setup_logging(level='INFO')
    117 
    118         if args.file == '-':
    119             info('Reading domains from stdin')
    120         else:
    121             info(f'Processing file: {args.file}')
    122 
    123     # Setup show_fields
    124     show_fields = {
    125         'status_code'      : args.all_flags or args.status_code,
    126         'content_type'     : args.all_flags or args.content_type,
    127         'content_length'   : args.all_flags or args.content_length,
    128         'title'            : args.all_flags or args.title,
    129         'body'             : args.all_flags or args.body,
    130         'ip'               : args.all_flags or args.ip,
    131         'favicon'          : args.all_flags or args.favicon,
    132         'headers'          : args.all_flags or args.headers,
    133         'follow_redirects' : args.all_flags or args.follow_redirects,
    134         'cname'            : args.all_flags or args.cname,
    135         'tls'              : args.all_flags or args.tls_info
    136     }
    137 
    138     # If no fields specified show all
    139     if not any(show_fields.values()):
    140         show_fields = {k: True for k in show_fields}
    141 
    142     try:
    143         # Create scanner instance
    144         scanner = HTTPZScanner(
    145             concurrent_limit=args.concurrent,
    146             timeout=args.timeout,
    147             follow_redirects=args.all_flags or args.follow_redirects,
    148             check_axfr=args.axfr,
    149             resolver_file=args.resolvers,
    150             output_file=args.output,
    151             show_progress=args.progress,
    152             debug_mode=args.debug,
    153             jsonl_output=args.jsonl,
    154             show_fields=show_fields,
    155             match_codes=args.match_codes,
    156             exclude_codes=args.exclude_codes
    157         )
    158 
    159         # Run the scanner with file/stdin input
    160         await scanner.scan(args.file)
    161 
    162     except KeyboardInterrupt:
    163         logging.warning('Process interrupted by user')
    164         sys.exit(1)
    165     except Exception as e:
    166         logging.error(f'Unexpected error: {str(e)}')
    167         sys.exit(1)
    168 
    169 def run():
    170     '''Entry point for the CLI'''
    171     asyncio.run(main())
    172 
    173 if __name__ == '__main__':
    174     run()