123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148 |
- # Copyright 2019 the gRPC authors.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- """A search algorithm over the space of all bytestrings."""
- from __future__ import absolute_import
- from __future__ import division
- from __future__ import print_function
- import base64
- import hashlib
- import itertools
- import logging
- import struct
- from examples.python.cancellation import hash_name_pb2
- _LOGGER = logging.getLogger(__name__)
- _BYTE_MAX = 255
- def _get_hamming_distance(a, b):
- """Calculates hamming distance between strings of equal length."""
- distance = 0
- for char_a, char_b in zip(a, b):
- if char_a != char_b:
- distance += 1
- return distance
- def _get_substring_hamming_distance(candidate, target):
- """Calculates the minimum hamming distance between between the target
- and any substring of the candidate.
- Args:
- candidate: The string whose substrings will be tested.
- target: The target string.
- Returns:
- The minimum Hamming distance between candidate and target.
- """
- min_distance = None
- if len(target) > len(candidate):
- raise ValueError("Candidate must be at least as long as target.")
- for i in range(len(candidate) - len(target) + 1):
- distance = _get_hamming_distance(candidate[i:i + len(target)].lower(),
- target.lower())
- if min_distance is None or distance < min_distance:
- min_distance = distance
- return min_distance
- def _get_hash(secret):
- hasher = hashlib.sha1()
- hasher.update(secret)
- return base64.b64encode(hasher.digest()).decode('ascii')
- class ResourceLimitExceededError(Exception):
- """Signifies the request has exceeded configured limits."""
- def _bytestrings_of_length(length):
- """Generates a stream containing all bytestrings of a given length.
- Args:
- length: A positive integer length.
- Yields:
- All bytestrings of length `length`.
- """
- for digits in itertools.product(range(_BYTE_MAX), repeat=length):
- yield b''.join(struct.pack('B', i) for i in digits)
- def _all_bytestrings():
- """Generates a stream containing all possible bytestrings.
- This generator does not terminate.
- Yields:
- All bytestrings in ascending order of length.
- """
- for bytestring in itertools.chain.from_iterable(
- _bytestrings_of_length(length) for length in itertools.count()):
- yield bytestring
- def search(target,
- ideal_distance,
- stop_event,
- maximum_hashes,
- interesting_hamming_distance=None):
- """Find candidate strings.
- Search through the space of all bytestrings, in order of increasing length,
- indefinitely, until a hash with a Hamming distance of `maximum_distance` or
- less has been found.
- Args:
- target: The search string.
- ideal_distance: The desired Hamming distance.
- stop_event: An event indicating whether the RPC should terminate.
- maximum_hashes: The maximum number of hashes to check before stopping.
- interesting_hamming_distance: If specified, strings with a Hamming
- distance from the target below this value will be yielded.
- Yields:
- Instances of HashNameResponse. The final entry in the stream will be of
- `maximum_distance` Hamming distance or less from the target string,
- while all others will be of less than `interesting_hamming_distance`.
- Raises:
- ResourceLimitExceededError: If the computation exceeds `maximum_hashes`
- iterations.
- """
- hashes_computed = 0
- for secret in _all_bytestrings():
- if stop_event.is_set():
- return
- candidate_hash = _get_hash(secret)
- distance = _get_substring_hamming_distance(candidate_hash, target)
- if interesting_hamming_distance is not None and distance <= interesting_hamming_distance:
- # Surface interesting candidates, but don't stop.
- yield hash_name_pb2.HashNameResponse(
- secret=base64.b64encode(secret),
- hashed_name=candidate_hash,
- hamming_distance=distance)
- elif distance <= ideal_distance:
- # Yield ideal candidate and end the stream.
- yield hash_name_pb2.HashNameResponse(
- secret=base64.b64encode(secret),
- hashed_name=candidate_hash,
- hamming_distance=distance)
- return
- hashes_computed += 1
- if hashes_computed == maximum_hashes:
- raise ResourceLimitExceededError()
|