mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
Hotfixing idefics base64 parsing.
This commit is contained in:
parent
3c373dcc53
commit
4930a9d8b7
@ -201,8 +201,13 @@ class IdeficsImageProcessor(BaseImageProcessor):
|
|||||||
response = requests.get(image_url_or_urls, stream=True, headers=headers, timeout=(1, 5))
|
response = requests.get(image_url_or_urls, stream=True, headers=headers, timeout=(1, 5))
|
||||||
response.raise_for_status()
|
response.raise_for_status()
|
||||||
content = response.content
|
content = response.content
|
||||||
else:
|
elif image.startswith("data:"):
|
||||||
|
# https://stackoverflow.com/questions/17090571/is-there-a-way-to-set-background-image-as-a-base64-encoded-image
|
||||||
|
# 
|
||||||
|
image = image.split(",")[-1]
|
||||||
content = base64.b64decode(image)
|
content = base64.b64decode(image)
|
||||||
|
else:
|
||||||
|
raise ValueError(f"Unrecognized image {image}")
|
||||||
|
|
||||||
try:
|
try:
|
||||||
image = Image.open(BytesIO(content))
|
image = Image.open(BytesIO(content))
|
||||||
|
@ -112,6 +112,11 @@ def is_url(string):
|
|||||||
result = urlparse(string)
|
result = urlparse(string)
|
||||||
return all([result.scheme, result.netloc])
|
return all([result.scheme, result.netloc])
|
||||||
|
|
||||||
|
def is_image(string):
|
||||||
|
"""Checks if the passed string contains a valid url and nothing else. e.g. if space is included it's immediately
|
||||||
|
invalidated the url"""
|
||||||
|
return is_url(string) or string.startswith("data:")
|
||||||
|
|
||||||
|
|
||||||
class IdeficsProcessor(ProcessorMixin):
|
class IdeficsProcessor(ProcessorMixin):
|
||||||
r"""
|
r"""
|
||||||
@ -314,7 +319,7 @@ class IdeficsProcessor(ProcessorMixin):
|
|||||||
|
|
||||||
if isinstance(item, str):
|
if isinstance(item, str):
|
||||||
item = item.strip(" ")
|
item = item.strip(" ")
|
||||||
if is_url(item):
|
if is_image(item):
|
||||||
image = self.image_processor.fetch_images(item)
|
image = self.image_processor.fetch_images(item)
|
||||||
full_text += image_tokens(last_was_image)
|
full_text += image_tokens(last_was_image)
|
||||||
image_objects.append(image)
|
image_objects.append(image)
|
||||||
@ -339,6 +344,7 @@ class IdeficsProcessor(ProcessorMixin):
|
|||||||
|
|
||||||
image_objects = self.image_processor(image_objects, transform=transform)
|
image_objects = self.image_processor(image_objects, transform=transform)
|
||||||
|
|
||||||
|
|
||||||
text_encoding = self.tokenizer(
|
text_encoding = self.tokenizer(
|
||||||
text=full_text,
|
text=full_text,
|
||||||
add_special_tokens=False,
|
add_special_tokens=False,
|
||||||
|
Loading…
Reference in New Issue
Block a user