方式1
def get_file_content_chrome(driver, uri):
result = driver.execute_async_script("""
var uri = arguments[0];
var callback = arguments[1];
var toBase64 = function(buffer){for(var r,n=new Uint8Array(buffer),t=n.length,a=new Uint8Array(4*Math.ceil(t/3)),i=new Uint8Array(64),o=0,c=0;64>c;++c)i[c]="ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/".charCodeAt(c);for(c=0;t-t%3>c;c+=3,o+=4)r=n[c]<<16|n[c+1]<<8|n[c+2],a[o]=i[r>>18],a[o+1]=i[r>>12&63],a[o+2]=i[r>>6&63],a[o+3]=i[63&r];return t%3===1?(r=n[t-1],a[o]=i[r>>2],a[o+1]=i[r<<4&63],a[o+2]=61,a[o+3]=61):t%3===2&&(r=(n[t-2]<<8)+n[t-1],a[o]=i[r>>10],a[o+1]=i[r>>4&63],a[o+2]=i[r<<2&63],a[o+3]=61),new TextDecoder("ascii").decode(a)};
var xhr = new XMLHttpRequest();
xhr.responseType = 'arraybuffer';
xhr.onload = function(){ callback(toBase64(xhr.response)) };
xhr.onerror = function(){ callback(xhr.status) };
xhr.open('GET', uri);
xhr.send();
""", uri)
if type(result) == int:
raise Exception("Request failed with status %s" % result)
return base64.b64decode(result)
bytes_data = get_file_content_chrome(driver, "blob:https://amazon-api.arkoselabs.com/8784ddf9-bbd2-48a6-b529-fc2bfcdaaebc")
# print('bytes_data:', bytes_data)
base64data0 = base64.b64encode(bytes_data).decode("utf8")
print('base64data0:', base64data0)
with open(f'./captcha0.jpg', 'wb') as file:
file.write(bytes_data)
方式2
js_img = '''function getImageBlob(url, cb) {
var xhr = new XMLHttpRequest();
xhr.open("get", url, true);
xhr.responseType = "blob";
xhr.onload = function() {
if (this.status == 200) {
if(cb) cb(this.response);
}
};
xhr.send();
}
function preView(url){
let reader = new FileReader();
getImageBlob( url , function(blob){
reader.readAsDataURL(blob);
});
reader.onload = function(e) {
img = document.querySelector('img#captchaimg')
if(img){
img.src = e.target.result;
document.body.appendChild(img);
}else{
var img = document.createElement("img");
img.id = 'captchaimg'
img.src = e.target.result;
document.body.appendChild(img);
}
}
}
preView("blob_image")'''
driver.execute_script(js_img.replace('blob_image', blob_image))
time.sleep(2)
captchaimg = driver.find_element(By.XPATH, '//img[@id="captchaimg"]').get_attribute('src')
print('captchaimg:', captchaimg)
base64data = captchaimg.split('base64,')[1]
with io.BytesIO(b64decode(base64data)) as image_file:
image = Image.open(image_file)
image.save('./captcha.jpg')
content_to_bytes = bytes(captchaimg.split('base64,')[1], 'utf-8')
with open(f'./captcha1.jpg', 'wb') as file:
file.write(base64.decodebytes(content_to_bytes))