Class: OxTenderAbstract::Client

Inherits:

Object

Object
OxTenderAbstract::Client

show all

Includes:: ContextualLogger

Defined in:: lib/oxtenderabstract/client.rb

Overview

Main client for working with Zakupki SOAP API

Instance Method Summary collapse

#download_archive_data(archive_url) ⇒ Object

Download and parse archive data.
#enhanced_search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, include_attachments: true) ⇒ Object

Enhanced search tenders with detailed information extraction.
#extract_attachments_from_xml(xml_content) ⇒ Object

Extract attachments info from XML.
#get_docs_by_reestr_number(reestr_number:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM) ⇒ Object

Get documents by registry number.
#get_docs_by_region(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE) ⇒ Object

Get documents by region and date.
#initialize(token: nil) ⇒ Client constructor

A new instance of Client.
#parse_xml_document(xml_content) ⇒ Object

Parse XML document.
#search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, include_attachments: true) ⇒ Object

Search tenders with full workflow: API -> Archive -> Parse.
#search_tenders_with_resume(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, start_from_archive: 0, resume_state: nil, include_attachments: true) ⇒ Object

Search tenders with automatic resume capability. Lets a download continue from where it was paused when the API blocks requests.

Methods included from ContextualLogger

included, #log_debug, #log_error, #log_fatal, #log_info, #log_warn, #logger

Constructor Details

#initialize(token: nil) ⇒ `Client`

Returns a new instance of Client.

# File 'lib/oxtenderabstract/client.rb', line 20

# Builds a client together with its own XML parser and archive processor.
#
# @param token [Object, nil] API token; when nil (or false) the value of
#   OxTenderAbstract.configuration.token is used instead
def initialize(token: nil)
  # An explicitly passed token takes precedence over the global configuration.
  @token = token || OxTenderAbstract.configuration.token
  @xml_parser = XmlParser.new
  @archive_processor = ArchiveProcessor.new
  # NOTE(review): validate_token! is defined outside this excerpt; presumably
  # it rejects a missing token — confirm.
  validate_token!
end

Instance Method Details

#download_archive_data(archive_url) ⇒ `Object`

Download and parse archive data



63
64
65

# File 'lib/oxtenderabstract/client.rb', line 63

# Download and parse archive data by delegating to the archive processor.
#
# @param archive_url [Object] archive location, passed through unchanged
# @return [Object] whatever ArchiveProcessor#download_and_extract returns;
#   the search methods of this class treat it as a result object that answers
#   failure?/error and whose data[:files] maps file names to file data
def download_archive_data(archive_url)
  @archive_processor.download_and_extract(archive_url)
end

#enhanced_search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, include_attachments: true) ⇒ `Object`

Enhanced search tenders with detailed information extraction

# File 'lib/oxtenderabstract/client.rb', line 175

# Enhanced search tenders with detailed information extraction.
#
# Asks the API for archive URLs, downloads each archive, parses every file
# whose name ends with ".xml" and collects the documents recognised as tenders.
# A failed download, or an exception raised while handling one archive or one
# file, is logged and skipped so the remaining archives are still processed
# (the same policy #search_tenders applies).
#
# @param org_region [Object] region passed to #get_docs_by_region
# @param exact_date [Object] date passed to #get_docs_by_region
# @param subsystem_type [Object] subsystem passed to #get_docs_by_region
# @param document_type [Object] document type passed to #get_docs_by_region
# @param include_attachments [Boolean] when true, attachment info is extracted
#   from each tender XML and stored under :attachments / :attachments_count
# @return [Result] the failed API result as-is, or a success whose data holds
#   :tenders, :total_archives, :processed_archives, :failed_archives,
#   :total_files, :processed_at and enhanced: true (the early "no archives"
#   result holds only :tenders, :total_archives and :total_files)
def enhanced_search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM,
                            document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE,
                            include_attachments: true)
  log_info "Starting enhanced tender search for region #{org_region}, date #{exact_date}"

  # Step 1: Get archive URLs from API
  api_result = get_docs_by_region(
    org_region: org_region,
    subsystem_type: subsystem_type,
    document_type: document_type,
    exact_date: exact_date
  )

  return api_result if api_result.failure?

  # A successful response may carry no :archive_urls at all; treat that the
  # same as an empty list instead of failing on nil.
  archive_urls = api_result.data[:archive_urls] || []
  return Result.success({ tenders: [], total_archives: 0, total_files: 0 }) if archive_urls.empty?

  log_info "Found #{archive_urls.size} archives to process"

  # Step 2: Process each archive with detailed information extraction
  all_tenders = []
  total_files = 0
  processed_archives = 0
  failed_archives = 0

  archive_urls.each_with_index do |archive_url, index|
    log_info "Processing archive #{index + 1}/#{archive_urls.size}"

    begin
      archive_result = download_archive_data(archive_url)

      if archive_result.failure?
        log_error "Failed to download archive #{index + 1}: #{archive_result.error}"
        failed_archives += 1
        next
      end

      processed_archives += 1
      files = archive_result.data[:files]
      total_files += files.size

      # Step 3: Parse XML files from archive with enhanced data extraction
      xml_files = files.select { |name, _| name.downcase.end_with?('.xml') }

      xml_files.each do |file_name, file_data|
        parse_result = parse_xml_document(file_data[:content])

        if parse_result.failure?
          log_debug "Failed to parse #{file_name}: #{parse_result.error}"
          next
        end

        next unless parse_result.data[:document_type] == :tender

        tender_data = parse_result.data[:content]
        # Tenders without a registry number are dropped.
        next if tender_data[:reestr_number].nil? || tender_data[:reestr_number].empty?

        # Step 4: Extract additional detailed information
        if include_attachments
          attachments_result = extract_attachments_from_xml(file_data[:content])
          if attachments_result.success?
            tender_data[:attachments] = attachments_result.data[:attachments]
            tender_data[:attachments_count] = attachments_result.data[:total_count]
          end
        end

        # Add metadata
        tender_data[:source_file] = file_name
        tender_data[:archive_url] = archive_url
        tender_data[:processed_at] = Time.now

        all_tenders << tender_data
      rescue StandardError => e
        # One broken file must not abort the rest of the archive.
        log_error "Error processing file #{file_name}: #{e.message}"
      end
    rescue StandardError => e
      # One broken archive must not abort the whole search.
      log_error "Critical error processing archive #{index + 1}: #{e.message}"
      failed_archives += 1
    end
  end

  log_info "Enhanced search completed. Found #{all_tenders.size} tenders in #{total_files} files"

  Result.success({
                   tenders: all_tenders,
                   total_archives: archive_urls.size,
                   processed_archives: processed_archives,
                   failed_archives: failed_archives,
                   total_files: total_files,
                   processed_at: Time.now,
                   enhanced: true
                 })
end

#extract_attachments_from_xml(xml_content) ⇒ `Object`

Extract attachments info from XML



73
74
75

# File 'lib/oxtenderabstract/client.rb', line 73

# Extract attachments info from XML by delegating to the XML parser.
#
# @param xml_content [Object] XML content, passed through unchanged
# @return [Object] whatever XmlParser#extract_attachments returns; the search
#   methods of this class read data[:attachments] and data[:total_count] from
#   it when it reports success?
def extract_attachments_from_xml(xml_content)
  @xml_parser.extract_attachments(xml_content)
end

#get_docs_by_reestr_number(reestr_number:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM) ⇒ `Object`

Get documents by registry number

# File 'lib/oxtenderabstract/client.rb', line 42

# Get documents by registry number.
#
# Validates the arguments, builds the request, runs the
# :get_docs_by_reestr_number SOAP operation and logs the outcome.
#
# @param reestr_number [Object] registry number to look up
# @param subsystem_type [Object] subsystem to query
# @return [Object] the result of execute_soap_request, returned untouched
def get_docs_by_reestr_number(reestr_number:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM)
  lookup_params = { reestr_number: reestr_number, subsystem_type: subsystem_type }
  validate_params!(lookup_params)

  payload = build_reestr_request(reestr_number, subsystem_type)
  log_info "Requesting documents for registry number: #{reestr_number}, type: #{subsystem_type}"

  # tap hands the response to the logging block and then returns it unchanged.
  execute_soap_request(:get_docs_by_reestr_number, payload).tap do |response|
    unless response.success?
      log_error "Error for #{reestr_number}: #{response.error}"
      next
    end

    # :archive_urls may be absent from a successful response; report zero then.
    archive_count = response.data[:archive_urls]&.size || 0
    log_info "Success response for #{reestr_number}. Found archives: #{archive_count}"
  end
end

#get_docs_by_region(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE) ⇒ `Object`

Get documents by region and date

# File 'lib/oxtenderabstract/client.rb', line 28

# Get documents by region and date.
#
# Validates the arguments, builds the region request and runs the
# :get_docs_by_org_region SOAP operation.
#
# @param org_region [Object] region to query
# @param exact_date [Object] date to query
# @param subsystem_type [Object] subsystem to query
# @param document_type [Object] document type to query
# @return [Object] the result of execute_soap_request
def get_docs_by_region(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM,
                       document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE)
  search_params = {
    org_region: org_region,
    subsystem_type: subsystem_type,
    document_type: document_type,
    exact_date: exact_date
  }
  validate_params!(search_params)

  execute_soap_request(
    :get_docs_by_org_region,
    build_region_request(org_region, subsystem_type, document_type, exact_date)
  )
end

#parse_xml_document(xml_content) ⇒ `Object`

Parse XML document



68
69
70

# File 'lib/oxtenderabstract/client.rb', line 68

# Parse XML document by delegating to the XML parser.
#
# @param xml_content [Object] XML content, passed through unchanged
# @return [Object] whatever XmlParser#parse returns; the search methods of
#   this class read data[:document_type] and data[:content] from it unless it
#   reports failure?
def parse_xml_document(xml_content)
  @xml_parser.parse(xml_content)
end

#search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, include_attachments: true) ⇒ `Object`

Search tenders with full workflow: API -> Archive -> Parse

# File 'lib/oxtenderabstract/client.rb', line 78

# Search tenders with full workflow: API -> Archive -> Parse.
#
# Asks the API for archive URLs, downloads each archive, parses every file
# whose name ends with ".xml" and collects the documents recognised as tenders.
# A failed download, or an exception raised while handling one archive or one
# file, is logged and skipped so the remaining archives are still processed.
#
# @param org_region [Object] region passed to #get_docs_by_region
# @param exact_date [Object] date passed to #get_docs_by_region
# @param subsystem_type [Object] subsystem passed to #get_docs_by_region
# @param document_type [Object] document type passed to #get_docs_by_region
# @param include_attachments [Boolean] when true, attachment info is extracted
#   from each tender XML and stored under :attachments / :attachments_count
# @return [Result] the failed API result as-is, or a success whose data holds
#   :tenders, :total_archives, :processed_archives, :failed_archives,
#   :total_files and :processed_at (the early "no archives" result holds only
#   :tenders, :total_archives and :total_files)
def search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM,
                   document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, include_attachments: true)
  log_info "Starting tender search for region #{org_region}, date #{exact_date}, subsystem: #{subsystem_type}, type: #{document_type}"

  # Step 1: Get archive URLs from API
  api_result = get_docs_by_region(
    org_region: org_region,
    subsystem_type: subsystem_type,
    document_type: document_type,
    exact_date: exact_date
  )

  return api_result if api_result.failure?

  # A successful response may carry no :archive_urls at all; treat that the
  # same as an empty list instead of failing on nil.
  archive_urls = api_result.data[:archive_urls] || []
  return Result.success({ tenders: [], total_archives: 0, total_files: 0 }) if archive_urls.empty?

  log_info "Found #{archive_urls.size} archives to process"

  # Step 2: Process each archive with error resilience
  all_tenders = []
  total_files = 0
  processed_archives = 0
  failed_archives = 0

  archive_urls.each_with_index do |archive_url, index|
    log_info "Processing archive #{index + 1}/#{archive_urls.size}"

    begin
      archive_result = download_archive_data(archive_url)

      if archive_result.failure?
        log_error "Failed to download archive #{index + 1}: #{archive_result.error}"
        failed_archives += 1
        next
      end

      processed_archives += 1
      files = archive_result.data[:files]
      total_files += files.size

      # Step 3: Parse XML files from archive
      xml_files = files.select { |name, _| name.downcase.end_with?('.xml') }
      log_debug "Found #{xml_files.size} XML files in archive #{index + 1}"

      xml_files.each do |file_name, file_data|
        parse_result = parse_xml_document(file_data[:content])

        if parse_result.failure?
          log_debug "Failed to parse #{file_name}: #{parse_result.error}"
          next
        end

        next unless parse_result.data[:document_type] == :tender

        tender_data = parse_result.data[:content]
        # Tenders without a registry number are dropped.
        next if tender_data[:reestr_number].nil? || tender_data[:reestr_number].empty?

        # Extract attachments if requested
        if include_attachments
          attachments_result = extract_attachments_from_xml(file_data[:content])
          if attachments_result.success?
            tender_data[:attachments] = attachments_result.data[:attachments]
            tender_data[:attachments_count] = attachments_result.data[:total_count]
          end
        end

        # Add metadata
        tender_data[:source_file] = file_name
        tender_data[:archive_url] = archive_url
        tender_data[:processed_at] = Time.now

        all_tenders << tender_data
      rescue StandardError => e
        log_error "Error processing file #{file_name}: #{e.message}"
        # Continue with other files
      end
    rescue StandardError => e
      log_error "Critical error processing archive #{index + 1}: #{e.message}"
      failed_archives += 1
      # Continue with other archives
    end
  end

  log_info "Search completed. Processed: #{processed_archives}/#{archive_urls.size} archives, Failed: #{failed_archives}, Found #{all_tenders.size} tenders in #{total_files} files"

  Result.success({
                   tenders: all_tenders,
                   total_archives: archive_urls.size,
                   processed_archives: processed_archives,
                   failed_archives: failed_archives,
                   total_files: total_files,
                   processed_at: Time.now
                 })
end

#search_tenders_with_resume(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, start_from_archive: 0, resume_state: nil, include_attachments: true) ⇒ `Object`

Search tenders with automatic resume capability. Lets a download continue from where it was paused when the API blocks requests.

# File 'lib/oxtenderabstract/client.rb', line 250

# Search tenders with automatic resume capability.
#
# Works like #search_tenders, but when an archive download fails with
# error_type :blocked (and auto_wait_on_block is disabled in the configuration)
# it stops and returns a failure whose metadata carries a :resume_state. Passing
# that state back in continues the search from the blocked archive without
# asking the API for the archive list again.
#
# @param org_region [Object] region passed to #get_docs_by_region
# @param exact_date [Object] date passed to #get_docs_by_region
# @param subsystem_type [Object] subsystem passed to #get_docs_by_region
# @param document_type [Object] document type passed to #get_docs_by_region
# @param start_from_archive [Integer] zero-based index of the first archive to
#   process; when left at 0 and a resume_state is given, the state's
#   :next_archive_index is used instead
# @param resume_state [Hash, nil] state taken from a previous blocked result
#   (:tenders, :total_files, :processed_archives, :failed_archives,
#   :archive_urls, :next_archive_index)
# @param include_attachments [Boolean] when true, attachment info is extracted
#   from each tender XML and stored under :attachments / :attachments_count
# @return [Result] the failed API result as-is; a failure with
#   error_type: :blocked, retry_after: 600 and resume_state: {...} when a
#   download is blocked; otherwise a success whose data holds :tenders,
#   :total_archives, :processed_archives, :failed_archives, :total_files,
#   :processed_at and completed: true
def search_tenders_with_resume(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM,
                               document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE,
                               start_from_archive: 0, resume_state: nil, include_attachments: true)
  log_info "Starting tender search with resume capability for region #{org_region}, date #{exact_date}"

  # The saved state records the archive that was blocked. Honour it unless the
  # caller picked an explicit position; otherwise already-processed archives
  # would be downloaded again and their tenders duplicated.
  if resume_state && start_from_archive.zero?
    start_from_archive = resume_state[:next_archive_index] || 0
  end
  log_info "Starting from archive #{start_from_archive}" if start_from_archive > 0

  # Restore the previous state if there is one
  if resume_state
    log_info "Resuming from previous state: #{resume_state[:processed_archives]} archives processed"
    # Work on a copy so the caller's state object is not modified in place.
    all_tenders = (resume_state[:tenders] || []).dup
    total_files = resume_state[:total_files] || 0
    processed_archives = resume_state[:processed_archives] || 0
    failed_archives = resume_state[:failed_archives] || 0
    archive_urls = resume_state[:archive_urls]
  else
    # Step 1: Get archive URLs from API
    api_result = get_docs_by_region(
      org_region: org_region,
      subsystem_type: subsystem_type,
      document_type: document_type,
      exact_date: exact_date
    )

    return api_result if api_result.failure?

    # A successful response may carry no :archive_urls at all; treat that the
    # same as an empty list instead of failing on nil.
    archive_urls = api_result.data[:archive_urls] || []
    return Result.success({ tenders: [], total_archives: 0, total_files: 0 }) if archive_urls.empty?

    all_tenders = []
    total_files = 0
    processed_archives = 0
    failed_archives = 0
  end

  log_info "Found #{archive_urls.size} archives to process (starting from #{start_from_archive})"

  # Step 2: Process archives starting from specified position
  (start_from_archive...archive_urls.size).each do |index|
    archive_url = archive_urls[index]
    log_info "Processing archive #{index + 1}/#{archive_urls.size}"

    begin
      archive_result = download_archive_data(archive_url)

      if archive_result.failure?
        # Check whether the download was blocked while automatic waiting is off
        if archive_result.metadata[:error_type] == :blocked &&
           !OxTenderAbstract.configuration.auto_wait_on_block
          # Hand back the progress so far so the caller can continue later
          saved_state = {
            tenders: all_tenders,
            total_files: total_files,
            processed_archives: processed_archives,
            failed_archives: failed_archives,
            archive_urls: archive_urls,
            next_archive_index: index
          }

          # NOTE(review): retry_after is presumably in seconds — confirm.
          return Result.failure(
            "Archive download blocked, can resume from archive #{index + 1}",
            error_type: :blocked,
            retry_after: 600,
            resume_state: saved_state
          )
        else
          log_error "Failed to download archive #{index + 1}: #{archive_result.error}"
          failed_archives += 1
          next
        end
      end

      processed_archives += 1
      files = archive_result.data[:files]
      total_files += files.size

      # Step 3: Parse XML files from archive
      xml_files = files.select { |name, _| name.downcase.end_with?('.xml') }
      log_debug "Found #{xml_files.size} XML files in archive #{index + 1}"

      xml_files.each do |file_name, file_data|
        parse_result = parse_xml_document(file_data[:content])

        if parse_result.failure?
          log_debug "Failed to parse #{file_name}: #{parse_result.error}"
          next
        end

        next unless parse_result.data[:document_type] == :tender

        tender_data = parse_result.data[:content]
        # Tenders without a registry number are dropped.
        next if tender_data[:reestr_number].nil? || tender_data[:reestr_number].empty?

        # Extract attachments if requested
        if include_attachments
          attachments_result = extract_attachments_from_xml(file_data[:content])
          if attachments_result.success?
            tender_data[:attachments] = attachments_result.data[:attachments]
            tender_data[:attachments_count] = attachments_result.data[:total_count]
          end
        end

        # Add metadata
        tender_data[:source_file] = file_name
        tender_data[:archive_url] = archive_url
        tender_data[:processed_at] = Time.now
        tender_data[:archive_index] = index

        all_tenders << tender_data
      rescue StandardError => e
        log_error "Error processing file #{file_name}: #{e.message}"
        # Continue with other files
      end
    rescue StandardError => e
      log_error "Critical error processing archive #{index + 1}: #{e.message}"
      failed_archives += 1
      # Continue with other archives
    end
  end

  log_info "Search completed. Processed: #{processed_archives}/#{archive_urls.size} archives, Failed: #{failed_archives}, Found #{all_tenders.size} tenders in #{total_files} files"

  Result.success({
                   tenders: all_tenders,
                   total_archives: archive_urls.size,
                   processed_archives: processed_archives,
                   failed_archives: failed_archives,
                   total_files: total_files,
                   processed_at: Time.now,
                   completed: true
                 })
end

Class: OxTenderAbstract::Client

Overview

Instance Method Summary collapse

Methods included from ContextualLogger

Constructor Details

#initialize(token: nil) ⇒ Client

Instance Method Details

#download_archive_data(archive_url) ⇒ Object

#enhanced_search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, include_attachments: true) ⇒ Object

#extract_attachments_from_xml(xml_content) ⇒ Object

#get_docs_by_reestr_number(reestr_number:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM) ⇒ Object

#get_docs_by_region(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE) ⇒ Object

#parse_xml_document(xml_content) ⇒ Object

#search_tenders(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, include_attachments: true) ⇒ Object

#search_tenders_with_resume(org_region:, exact_date:, subsystem_type: DocumentTypes::DEFAULT_SUBSYSTEM, document_type: DocumentTypes::DEFAULT_DOCUMENT_TYPE, start_from_archive: 0, resume_state: nil, include_attachments: true) ⇒ Object