Find orderly but empty string in an array

topic

Given a string array arr, arr Some None position, but not the position of None, ordered string. Given a string s, returns the leftmost position s occurring in the arr.
As = ARR [None, 'A', None, 'A', None, 'B, None,' C ']
S =' A ', returns. 1
S None = -1
S =' D ', -1

Thinking

Possible use binary search, if found during half None position, has to traverse to find a location to one side is not None, depending on the size and location of the string, which is determined to continue the half-half.

Achieve 1

def search_string(arr, s):
    left = 0
    right = len(arr) - 1
    result = -1

    while left <= right:
        m = (left + right) // 2
        if arr[m] is not None:
            if arr[m] == s:
                result = m
                right = m - 1
            elif arr[m] < s:
                left = m + 1
            else:
                right = m - 1
        else:
            i = m
            while i >= left and arr[i] is None:
                i -= 1

            if i < left or arr[i] < s:
                left = m + 1
            elif arr[i] == s:
                result = i
                right = i - 1
            else:
                right = i - 1

    return result

Another way

To find the equivalent of the left-most position, similar to lower_bound, but can not find the need to return -1, personally I prefer a lower_bound wording:

def lower_bound(nums, target):
    begin = 0
    end = len(nums)

    while begin < end:
        mid = (begin + end) // 2
        if nums[mid] < target:
            begin = mid + 1
        else:
            end = mid

    return begin

A similar method to solve the problem:

def search_string2(arr, s):
    left = 0
    right = len(arr)

    while left < right:
        m = (left + right) // 2
        if arr[m] is not None:
            if arr[m] < s:
                left = m + 1
            else:
                right = m
        else:
            i = m
            while i >= left and arr[i] is None:
                i -= 1

            if i < left or arr[i] < s:
                left = m + 1
            else:
                right = i

    return left if left < len(arr) and arr[left] == s else -1

test

def test_search_string():
    arr = [None, None, 'a', None, None, 'b', 'c', None, 'd',
           None, None, 'e', 'f', 'g', None, 'h', None, 'i']

    print(search_string(arr, 'A'), search_string2(arr, 'A'))
    print(search_string(arr, 'a'), search_string2(arr, 'a'))
    print(search_string(arr, 'b'), search_string2(arr, 'b'))
    print(search_string(arr, 'c'), search_string2(arr, 'c'))
    print(search_string(arr, 'd'), search_string2(arr, 'd'))
    print(search_string(arr, 'e'), search_string2(arr, 'e'))
    print(search_string(arr, 'f'), search_string2(arr, 'f'))
    print(search_string(arr, 'g'), search_string2(arr, 'g'))
    print(search_string(arr, 'h'), search_string2(arr, 'h'))
    print(search_string(arr, 'i'), search_string2(arr, 'i'))
    print(search_string(arr, 'j'), search_string2(arr, 'j'))

    arr = []
    for i in range(100):
        size = random.randint(0, 26)
        s = ''.join(random.sample(string.ascii_letters+string.digits, size))
        arr.append(s)

    arr = sorted(arr)
    for i in range(100):
        arr.insert(random.randint(0, len(arr)), None)

    for i in range(len(arr)):
        s = arr[i]
        if s is None:
            size = random.randint(0, 26)
            s = ''.join(random.sample(string.ascii_letters, size))
            if s not in arr:
                assert(search_string2(arr, s) == search_string(arr, s))
        else:
            assert(search_string2(arr, s) == search_string(arr, s))

    print('pass')


if __name__ == '__main__':
    test_search_string()
Published 217 original articles · won praise 132 · views 320 000 +

Guess you like

Origin blog.csdn.net/guzhou_diaoke/article/details/103939351