T0nyX1ang/WHU-ScoreChecker

View on GitHub
scorechecker/image/predict.py

Summary

Maintainability
A
0 mins
Test Coverage
"""
Predict the captcha from an image downloaded from a certain pattern.

The pattern is based on the captcha model.
The captcha model should be a Keras-loaded model Object that has a function
'predict'.
This function utilized partition and process function.
"""

import numpy
from .process import preprocess, resize, otsu
from .partition import partition


def predict_captcha(bytes_im, model):
    """
    Main predict function.

    'bytes_im' is a bytes image which is downloaded on Internet.
    'model' is a Keras sequence model Object.
    """
    captcha = ''
    convert = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz'
    if bytes_im is None:
        print('You should load an image to predict its captcha.')
        return captcha

    if model:
        array_im = numpy.asarray(bytearray(bytes_im), dtype='uint8')
        proc_im = preprocess(array_im)
        parts = partition(proc_im)
        for val in parts:
            crop = proc_im[val[1]:val[1] + val[3], val[0]:val[0] + val[2]]
            letter = resize(crop, width=20, height=20)
            letter = otsu(letter)  # threshold again for more simple image
            letter = numpy.expand_dims(letter, axis=2) // 255
            letter = numpy.expand_dims(letter, axis=0)
            prediction = model.predict(letter)  # predict the letter
            captcha += convert[numpy.argmax(prediction)]
    return captcha