1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123
use bytes::Bytes;
use serde::Serialize;
use crate::{
config::Config,
error::OpenAIError,
types::{CreateFileRequest, DeleteFileResponse, ListFilesResponse, OpenAIFile},
Client,
};
/// Files are used to upload documents that can be used with features like Assistants and Fine-tuning.
pub struct Files<'c, C: Config> {
client: &'c Client<C>,
}
impl<'c, C: Config> Files<'c, C> {
pub fn new(client: &'c Client<C>) -> Self {
Self { client }
}
/// Upload a file that can be used across various endpoints. Individual files can be up to 512 MB, and the size of all files uploaded by one organization can be up to 100 GB.
///
/// The Assistants API supports files up to 2 million tokens and of specific file types. See the [Assistants Tools guide](https://platform.openai.com/docs/assistants/tools) for details.
///
/// The Fine-tuning API only supports `.jsonl` files. The input also has certain required formats for fine-tuning [chat](https://platform.openai.com/docs/api-reference/fine-tuning/chat-input) or [completions](https://platform.openai.com/docs/api-reference/fine-tuning/completions-input) models.
///
///The Batch API only supports `.jsonl` files up to 100 MB in size. The input also has a specific required [format](https://platform.openai.com/docs/api-reference/batch/request-input).
///
/// Please [contact us](https://help.openai.com/) if you need to increase these storage limits.
pub async fn create(&self, request: CreateFileRequest) -> Result<OpenAIFile, OpenAIError> {
self.client.post_form("/files", request).await
}
/// Returns a list of files that belong to the user's organization.
pub async fn list<Q>(&self, query: &Q) -> Result<ListFilesResponse, OpenAIError>
where
Q: Serialize + ?Sized,
{
self.client.get_with_query("/files", query).await
}
/// Returns information about a specific file.
pub async fn retrieve(&self, file_id: &str) -> Result<OpenAIFile, OpenAIError> {
self.client.get(format!("/files/{file_id}").as_str()).await
}
/// Delete a file.
pub async fn delete(&self, file_id: &str) -> Result<DeleteFileResponse, OpenAIError> {
self.client
.delete(format!("/files/{file_id}").as_str())
.await
}
/// Returns the contents of the specified file
pub async fn content(&self, file_id: &str) -> Result<Bytes, OpenAIError> {
self.client
.get_raw(format!("/files/{file_id}/content").as_str())
.await
}
}
#[cfg(test)]
mod tests {
use crate::{
types::{CreateFileRequestArgs, FilePurpose},
Client,
};
#[tokio::test]
async fn test_file_mod() {
let test_file_path = "/tmp/test.jsonl";
let contents = concat!(
"{\"prompt\": \"<prompt text>\", \"completion\": \"<ideal generated text>\"}\n", // \n is to make it valid jsonl
"{\"prompt\": \"<prompt text>\", \"completion\": \"<ideal generated text>\"}"
);
tokio::fs::write(test_file_path, contents).await.unwrap();
let client = Client::new();
let request = CreateFileRequestArgs::default()
.file(test_file_path)
.purpose(FilePurpose::FineTune)
.build()
.unwrap();
let openai_file = client.files().create(request).await.unwrap();
assert_eq!(openai_file.bytes, 135);
assert_eq!(openai_file.filename, "test.jsonl");
//assert_eq!(openai_file.purpose, "fine-tune");
//assert_eq!(openai_file.status, Some("processed".to_owned())); // uploaded or processed
let query = [("purpose", "fine-tune")];
let list_files = client.files().list(&query).await.unwrap();
assert_eq!(list_files.data.into_iter().last().unwrap(), openai_file);
let retrieved_file = client.files().retrieve(&openai_file.id).await.unwrap();
assert_eq!(openai_file.created_at, retrieved_file.created_at);
assert_eq!(openai_file.bytes, retrieved_file.bytes);
assert_eq!(openai_file.filename, retrieved_file.filename);
assert_eq!(openai_file.purpose, retrieved_file.purpose);
/*
// "To help mitigate abuse, downloading of fine-tune training files is disabled for free accounts."
let retrieved_contents = client.files().retrieve_content(&openai_file.id)
.await
.unwrap();
assert_eq!(contents, retrieved_contents);
*/
// Sleep to prevent "File is still processing. Check back later."
tokio::time::sleep(std::time::Duration::from_secs(15)).await;
let delete_response = client.files().delete(&openai_file.id).await.unwrap();
assert_eq!(openai_file.id, delete_response.id);
assert!(delete_response.deleted);
}
}