# Image upload

Here is an example of creating a new dataset and uploading images to it with categories and annotations.

# Create a dataset

def create_dataset(dataset_name):
    request = {
        "name": dataset_name
    }
    response = requests.post(url=f'{OSAI_URL}/Datasets', headers=HEADERS, json=request).json()
    dataset_id = response["id"]
    return dataset_id

# Create a category

When using the API to upload images from categories, you will need to create the categories you need in advance so that when you upload images, you provide the correct id of the categories used in the dataset.

def create_category(dataset_id, category_name):
    request = {
        "datasetId": dataset_id,
        "name": category_name
    }
    response = requests.post(
        f'{OSAI_URL}/Categories', headers=HEADERS, json=request
    ).json()
    return respone

# Upload

# Start and end of upload

You must start the upload manually. The dataset will then be locked and you will be able to upload photos. Once you have finished uploading photos, you need to stop uploading to unlock the dataset. If you forget to do this, the dataset will automatically unlock itself after a certain period of time of not receiving new photos.

def start_uploading(dataset_id):
    response = requests.post(
        f'{OSAI_URL}/Datasets/{dataset_id}/StartUploading', headers=HEADERS
    ).json()
    return response


def finish_uploading(dataset_id, upload_id):
    response = requests.post(
        f'{OSAI_URL}/Datasets/{dataset_id}/FinishUploading', headers=HEADERS, params={"datasetUploadId": upload_id}
    )
    print(response)    

# Send images

def send_images(dataset_id, upload_id, path):
    images_data = get_images_data(path)
    categories_id = create_categories_for_images_data(images_data, dataset_id)

    for image in images_data:
        response = upload_image(dataset_id, categories_id, upload_id, image)
        print(response)

Photos are sent as multipart/form-data, which must include:

  • DatasetID
  • DatasetUploadID
  • ImagsMetadata - containing data such as:
    • name
    • annotationType
    • annotation
    • classifyCategoryId
  • ImagesFles
def upload_image(dataset_id, categories_id, upload_id, image):
    annotation = get_annotation(image)
    encoded_content = base64.b64encode(bytes(annotation['content'], 'utf-8'))
    file_name = image['name'] + image['extension']
    file_path= image['path'] + os.sep + file_name
    form_data = {
            'datasetId': dataset_id,
            'datasetUploadId': upload_id,
            'imagesMetadata[0][name]': file_name,
            'imagesMetadata[0][annotationType]': annotation['type'],
            'imagesMetadata[0][annotation]': encoded_content,
            'imagesMetadata[0][classifyCategoryId]': categories_id[image['category']],
        }
    files = {'imagesFiles': (file_name, open(file_path, 'rb'))} 
    response = requests.post(
            f'{OSAI_URL}/Images/UploadChunk',headers=HEADERS, 
            params={'skipUnsupportedImages': False}, data=form_data, files=files
        )
    
    return response

# Get image metadata

To make it easier to manage uploaded images, you can break down information about a photo by uploading classifications and annotations to it.

def get_images_data(path):    
    image_list =[] 
    for root, _dirs, files in os.walk(path):
        for file in files:
            suffix = pathlib.Path(file).suffix
            name = pathlib.Path(file).stem
            if suffix == '.jpg' or suffix == '.png':
                annotation = None
                if  os.path.isfile(root + os.sep + name + '.xml'):
                    annotation = '.xml'
                image_list.append({'path': root, 'name': name, 'extension': suffix, 'category': os.path.basename(root), 'annotation_file':annotation})
    
    return image_list           

# Add categories to upload

In this example, we use the parent folder to assign the classification.

def create_categories_for_images_data(images_data, dataset_id):
    categories = []
    categories_ids = {}
    for image in images_data:
        if image['category'] not in categories:
            categories.append(image['category'])
    for category in categories:
        categories_ids[category] = create_category(dataset_id, category)['id']
    
    return categories_ids

# Add .xml annotation to upload

The .xml files require that the metadata for the images include a valid annotationType so that the server will know how to decode the information it has. The .xml file should be uploaded as a encoded string in base64.

def get_annotation(image_data):
    annotation = {}
    if image_data['annotation_file'] == '.xml':
        file_path = image_data['path']+ os.sep + image_data['name'] + image_data['annotation_file']
        annotation['type']=0
        with open(file_path) as file:
            annotation['content'] = file.read()
    else:
        annotation['type']=None
        annotation['content'] = ''
    
    return annotation

# Example

import requests
import os
import pathlib
import base64

OSAI_URL = 'https://app-eu.onestepai.com/api'
API_TOKEN = 'OUR ACCESS TOKEN GENERATED IN OSAI'
HEADERS = {'Authorization': None}

def main():
    token = sign_in()
    global HEADERS   
    HEADERS = {'Authorization': f'Bearer {token.text}'}

    print('------Create dataset------')
    dataset_id = create_dataset('holy_hand_grenade')
    print('-----Uploading------')
    upload_id = start_uploading(dataset_id)
    send_images(dataset_id, upload_id, "zdj")
    finish_uploading(dataset_id, upload_id)


def sign_in():
    response = requests.post(
        url=f'{OSAI_URL}/Users/SignIn', json=API_TOKEN)
    return response


def create_dataset(dataset_name):
    request = {
        'name': dataset_name
    }
    response = requests.post(url=f'{OSAI_URL}/Datasets', headers=HEADERS, json = request).json()
    dataset_id = response['id']
    print(f'Dataset created with id: {dataset_id}')
    return dataset_id


def create_category(dataset_id, category_name):
    request = {
        'datasetId': dataset_id,
        'name': category_name
    }
    response = requests.post(
        f'{OSAI_URL}/Categories', headers=HEADERS, json=request
    ).json()
    return response


def send_images(dataset_id, upload_id, path):
    images_data = get_images_data(path)
    categories_id = create_categories_for_images_data(images_data, dataset_id)

    for image in images_data:
        response = upload_image(dataset_id, categories_id, upload_id, image)
        print(response)


def start_uploading(dataset_id):
    response = requests.post(
        f'{OSAI_URL}/Datasets/{dataset_id}/StartUploading', headers=HEADERS
    ).json()
    return response


def finish_uploading(dataset_id, upload_id):
    response = requests.post(
        f'{OSAI_URL}/Datasets/{dataset_id}/FinishUploading', headers=HEADERS, params={'datasetUploadId': upload_id}
    )
    print(response)    


def upload_image(dataset_id, categories_id, upload_id, image):
    annotation = get_annotation(image)
    encoded_content = base64.b64encode(bytes(annotation['content'], 'utf-8'))
    file_name = image['name'] + image['extension']
    file_path= image['path'] + os.sep + file_name
    form_data = {
            'datasetId': dataset_id,
            'datasetUploadId': upload_id,
            'imagesMetadata[0][name]': file_name,
            'imagesMetadata[0][annotationType]': annotation['type'],
            'imagesMetadata[0][annotation]': encoded_content,
            'imagesMetadata[0][classifyCategoryId]': categories_id[image['category']],
        }
    files = {'imagesFiles': (file_name, open(file_path, 'rb'))} 
    response = requests.post(
            f'{OSAI_URL}/Images/UploadChunk',headers=HEADERS, 
            params={'skipUnsupportedImages': False}, data=form_data, files=files
        )
    
    return response


def get_annotation(image_data):
    annotation = {}
    if image_data['annotation_file'] == '.xml':
        file_path = image_data['path']+ os.sep + image_data['name'] + image_data['annotation_file']
        annotation['type']=0
        with open(file_path) as file:
            annotation['content'] = file.read()
    else:
        annotation['type']=None
        annotation['content'] = ''
    
    return annotation


def create_categories_for_images_data(images_data, dataset_id):
    categories = []
    categories_ids = {}
    for image in images_data:
        if image['category'] not in categories:
            categories.append(image['category'])
    for category in categories:
        categories_ids[category] = create_category(dataset_id, category)['id']
    
    return categories_ids


def get_images_data(path):    
    image_list =[] 
    for root, _dirs, files in os.walk(path):
        for file in files:
            suffix = pathlib.Path(file).suffix
            name = pathlib.Path(file).stem
            if suffix == '.jpg' or suffix == '.png':
                annotation = None
                if  os.path.isfile(root + os.sep + name + '.xml'):
                    annotation = '.xml'
                image_list.append({'path': root, 'name': name, 'extension': suffix, 'category': os.path.basename(root), 'annotation_file': annotation})
    
    return image_list           
                

if __name__ == '__main__':
    main()
------Create dataset------
Dataset created with id: 514
-----Uploading------
<Response [200]>
<Response [200]>
<Response [200]>
<Response [200]>
<Response [200]>
<Response [200]>
<Response [200]>
<Response [200]>
<Response [200]>