Last active
December 4, 2025 07:02
-
-
Save matsubo/c1366c36b1045484a00d0756ab082f3a to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/bin/bash
# Reproduce the uploadToFileSearchStore MIME type issue end to end:
# create the test workbook, download the PoC script, and run it.
#
# Please ensure GOOGLE_API_KEY is set.
# The key can be found: https://aistudio.google.com/apps

# Abort on the first failing command, on unset variables, and on failures
# inside pipelines, so a broken download or decode is never executed.
set -euo pipefail

# Create test.xlsx file
# NOTE(review): the base64 payload is empty here, so this writes an empty
# test.xlsx; paste the base64 of a real workbook between the quotes if the
# reproduction needs actual spreadsheet content.
echo "" | base64 -d > test.xlsx

# Download PoC script
# -f: fail on HTTP errors instead of saving the error page as the script,
# -sS: no progress meter but still print errors, -L: follow redirects.
curl -fsSL -o poc_mime_type_issue.py \
  https://gist.githubusercontent.com/matsubo/c1366c36b1045484a00d0756ab082f3a/raw/poc_mime_type_issue.py

# Execute
python poc_mime_type_issue.py
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
"""
Proof of Concept: MIME Type Validation issue in uploadToFileSearchStore API

This script demonstrates a server-side validation issue where the API rejects a
valid MIME type for Excel files (.xlsx).

Error: 400 INVALID_ARGUMENT
Message: "When provided, MIME type must be in a valid type/subtype format"
MIME Type Used: application/vnd.openxmlformats-officedocument.spreadsheetml.sheet

Issue: The MIME type IS in valid type/subtype format, but the API incorrectly rejects it.

The script runs three steps against a freshly created file search store:
  1. direct upload with an explicit mime_type,
  2. direct upload without mime_type,
  3. File API upload followed by import into the store,
and deletes the store again before printing the summary.
"""

import os
import time

from dotenv import load_dotenv
from google import genai
from google.genai import types

TEST_FILE = "test.xlsx"
MIME_TYPE = "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"

# Upper bound for waiting on a single long-running operation, so a stuck
# operation cannot hang the PoC forever.
OPERATION_TIMEOUT_SECONDS = 300

RULE = "=" * 80

# Outcome labels shared by the three steps and the final summary.
STATUS_OK = "succeeded"
STATUS_MIME_REJECTED = "rejected with a MIME type error"
STATUS_FAILED = "failed with another error"


def _wait_for_operation(client, operation, *, poll_interval=2.0,
                        timeout=OPERATION_TIMEOUT_SECONDS, show_progress=False):
    """Poll *operation* until it is done and return the final operation object.

    Args:
        client: The genai client used to refresh the operation.
        operation: The long-running operation returned by an upload/import call.
        poll_interval: Seconds to sleep between polls.
        timeout: Maximum number of seconds to wait before giving up.
        show_progress: When true, print one dot per poll on the current line.

    Raises:
        TimeoutError: The operation did not finish within *timeout* seconds.
        RuntimeError: The operation finished but reports an error.
    """
    deadline = time.monotonic() + timeout
    while not operation.done:
        if time.monotonic() >= deadline:
            name = getattr(operation, "name", "<unnamed>")
            raise TimeoutError(
                f"Operation {name} did not finish within {timeout} seconds"
            )
        time.sleep(poll_interval)
        if show_progress:
            print(".", end="", flush=True)
        operation = client.operations.get(operation)

    # "done" only means the operation stopped; it may still have failed.
    # getattr keeps this safe if the operation type carries no error field.
    error = getattr(operation, "error", None)
    if error:
        name = getattr(operation, "name", "<unnamed>")
        raise RuntimeError(f"Operation {name} finished with an error: {error}")
    return operation


def _is_mime_type_rejection(exc):
    """Return True when *exc* looks like the 400 MIME type rejection under test.

    Any other failure (missing file, bad API key, quota, timeout, ...) must not
    be reported as a confirmation of the issue.
    """
    return getattr(exc, "code", None) == 400 and "mime" in str(exc).lower()


def _upload_with_mime_type(client, store_name):
    """Step 1: upload the workbook directly with the explicit MIME type."""
    print("\n1. Uploading Excel file (.xlsx) with correct MIME type...")
    print(f" File: {TEST_FILE}")
    print(f" MIME Type: {MIME_TYPE}")
    print(" Note: This MIME type is the official IANA-registered type for .xlsx files")

    try:
        with open(TEST_FILE, 'rb') as f:
            operation = client.file_search_stores.upload_to_file_search_store(
                file=f,
                file_search_store_name=store_name,
                config={
                    'display_name': 'test.xlsx',
                    'mime_type': MIME_TYPE,  # VALID MIME TYPE
                },
            )
        _wait_for_operation(client, operation)
    except Exception as exc:  # PoC boundary: report every failure, then go on
        print("\n ✗ ERROR: Upload failed")
        print(f"\n{exc}")
        if not _is_mime_type_rejection(exc):
            print("\n NOTE: This error is not the MIME type rejection; "
                  "the issue is neither confirmed nor refuted by this step.")
            return STATUS_FAILED
        print("\n" + RULE)
        print("ISSUE CONFIRMED")
        print(RULE)
        print("The API incorrectly rejects the MIME type:")
        print(f" {MIME_TYPE}")
        print("\nThis is a valid IANA-registered MIME type in 'type/subtype' format.")
        print("Expected: API should accept this MIME type")
        print("Actual: API returns 400 INVALID_ARGUMENT")
        print(RULE)
        return STATUS_MIME_REJECTED

    print("\n ✓ SUCCESS: File uploaded successfully")
    return STATUS_OK


def _upload_without_mime_type(client, store_name, step1_status):
    """Step 2: upload the workbook directly, letting the API pick the MIME type."""
    print("\n\n2. Testing upload WITHOUT mime_type parameter...")
    try:
        with open(TEST_FILE, 'rb') as f:
            operation = client.file_search_stores.upload_to_file_search_store(
                file=f,
                file_search_store_name=store_name,
                config={
                    'display_name': 'test-without-mimetype.xlsx',
                    # NO mime_type specified
                },
            )
        _wait_for_operation(client, operation)
    except Exception as exc:  # PoC boundary: report every failure, then go on
        print(f"\n ✗ Also failed without mime_type: {exc}")
        return STATUS_FAILED

    print(" ✓ SUCCESS: File uploaded without mime_type parameter")
    # Only claim confirmation when step 1 really hit the MIME type rejection.
    if step1_status == STATUS_MIME_REJECTED:
        print("\n This confirms the issue: The API works when mime_type is omitted,")
        print(" but fails when the correct mime_type is provided.")
    return STATUS_OK


def _upload_via_file_api(client, store_name):
    """Step 3: upload through the File API, then import the file into the store."""
    print("\n\n3. Testing alternative approach: File API upload → import to store...")
    print(" This tests if using client.files.upload() + import_file() works better")
    try:
        # Upload file using File API
        with open(TEST_FILE, 'rb') as f:
            file_ref = client.files.upload(
                file=f,
                config=types.UploadFileConfig(
                    display_name='test-via-file-api.xlsx',
                    mime_type=MIME_TYPE,
                ),
            )
        print(f" ✓ Uploaded via File API: {file_ref.name}")

        # Import the uploaded file into the file search store
        import_op = client.file_search_stores.import_file(
            file_search_store_name=store_name,
            file_name=file_ref.name,
        )
        print(f" File import started: {import_op.name}")
        print(" Waiting for import to complete", end="")
        _wait_for_operation(client, import_op, poll_interval=1.0, show_progress=True)
        print()
    except Exception as exc:  # PoC boundary: report every failure, then go on
        print(f"\n ✗ Failed with File API approach: {exc}")
        return STATUS_FAILED

    print(" ✓ SUCCESS: File imported successfully via File API → import_file()")
    print("\n This approach works! Use File API upload + import as a workaround.")
    return STATUS_OK


def main():
    """Run the three reproduction steps and print a summary of what happened.

    Raises:
        ValueError: GOOGLE_API_KEY is not available.
        FileNotFoundError: The test workbook does not exist.
    """
    # Load environment variables
    load_dotenv()

    # Get API key
    api_key = os.getenv('GOOGLE_API_KEY')
    if not api_key:
        raise ValueError("GOOGLE_API_KEY not found in environment variables")

    # Fail before creating any remote resources if the input is missing.
    if not os.path.isfile(TEST_FILE):
        raise FileNotFoundError(f"{TEST_FILE} not found; create it before running the PoC")

    client = genai.Client(api_key=api_key)

    print(RULE)
    print("PoC: MIME Type issue in uploadToFileSearchStore API")
    print(RULE)

    # Preparation: Create a file search store
    print("\nPreparation: Creating file search store...")
    file_search_store = client.file_search_stores.create(
        config={'display_name': 'poc-mime-type-xlsx'}
    )
    print(f" Created: {file_search_store.name}")

    step1 = step2 = step3 = "not run"
    try:
        step1 = _upload_with_mime_type(client, file_search_store.name)
        step2 = _upload_without_mime_type(client, file_search_store.name, step1)
        step3 = _upload_via_file_api(client, file_search_store.name)
    finally:
        # Best-effort cleanup so repeated runs do not pile up stores;
        # force=True also removes the documents uploaded by the steps.
        try:
            client.file_search_stores.delete(
                name=file_search_store.name,
                config={'force': True},
            )
            print(f"\nCleanup: deleted {file_search_store.name}")
        except Exception as exc:
            print(f"\nCleanup: could not delete {file_search_store.name}: {exc}")

    print("\n" + RULE)
    print("PoC Complete")
    print(RULE)
    print("\nSUMMARY:")
    print(f" Step 1 (direct upload with mime_type): Expected to fail - observed: {step1}")
    print(f" Step 2 (direct upload without mime_type): May work - observed: {step2}")
    print(f" Step 3 (File API + import): Recommended workaround - observed: {step3}")
    print(RULE)


if __name__ == "__main__":
    main()
Author
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Output
package version