22:["$","$L48",null,{"formats":"$undefined","locale":"en","messages":{"about":{"a_world_where_any_company":"A world where any company can use generative AI.","advisor":{"Career1":"Former COO of Moloco, pre-IPO AI company with $250M+ revenue","Degree":"M.S., Operations Research and Industrial Engineering, Cornell University","name":"Brian Yoo","role":"Advisor"},"by_eliminating_complexities":"By eliminating the complexities of generative AI serving, we aim to empower more companies to achieve innovation with generative AI.","ceo":{"Career1":"Visiting Research Scientist, Facebook","Career2":"Principal Scientist, Microsoft","Career3":"Research Scientist, Yahoo!","Career4":"Research Scientist, Intel","Degree1":"Ph.D., Computer Science, University of California, Berkeley","Degree2":"M.S., Computer Science, Stanford University","Professor":"Professor, Computer Science and Engineering Department, Seoul National University (Sabbatical Leave)","name":"Byung-Gon Chun","role":"Founder & CEO"},"coo":{"Career1":"Former CEO and Co-Founder of Qeexo acquired by TDK","Degree":"MBA, Haas School of Business at UC Berkeley","name":"Sang-won Lee","role":"COO"},"cto":{"Degree":"Ph.D., Computer Science and Engineering, Seoul National University","name":"Gyeong-In Yu","role":"CTO"},"efficient_automated_gen_ai_model_serving":"Efficient, automated generative AI model serving.","empowering_orgs_to_harness":"Empowering organizations to harness the full potential of generative AI models with ease and cost-efficiency.","leadership":"LEADERSHIP","leading_the_development":"Leading the development of generative AI serving with a brilliant team","mission":"MISSION","serving_generative_ai_for_all":"Serving Generative AI for All","we_believe_efficient_and_scalable_use":"We believe that the efficient and scalable use of generative AI models should be for everyone."},"annex":{"here":"here","performance_compared_to_vllm":"2. 
Performance compared to vLLM on a single NVIDIA A100 80GB GPU running AWQ-ed Mixtral 8x7B from Mistral AI with the following settings: mean input token length = 500, mean output token length = 150. Evaluation conducted by FriendliAI.","performance_of_friendli_container":"3. Performance of Friendli Container compared to vLLM on a single NVIDIA A100 80GB GPU running AWQ-ed Mixtral 8x7B from Mistral AI with the following settings: mean input token length = 500, mean output token length = 150, mean request per second = 0.5. Evaluation conducted by FriendliAI.","testing_conducted_by_friendli_oct_2023":"1. Testing conducted by FriendliAI in October 2023 using Llama-2-13B running on Friendli Inference. See the detailed results and methodology here."},"auth":{"sign_out":"Sign out"},"container":{"back_to_repository":"Back to repository","back_to_specific_repository":"Back to {repositoryName}","check_our_docs_for_detailed_options":"Check our docs for detailed options, including examples for multi-GPU and multi-LoRA serving.","click_button_below_to_create":"Click the button below to create a new secret.","container_image_is_only_valid":"The container image is only valid for {count} days and CANNOT be used for production. 
The container should be able to connect to the FriendliAI metering server.","container_secrets":"Container secrets","create_secret":"Create secret","create_secret_button":"Create secret","create_secret_disabled_team_role_not_privileged_tooltip":"Create secret requires a team role of Admin or higher.","created_at":"Created at","currently_used":"currently used","description":"Description","download_instructions":"Download instructions","during_free_trial":"During the 60-day free trial period, you can use registry.friendli.ai/trial:latest only.","find_repositories_by":"Find repositories by name","friendli_container_secrets":"Friendli Container secrets","generate_access_token":"Generate a Friendli Token (personal access token)","generate_access_token_description":"FRIENDLI_TOKEN (Personal access token) is the user credential for logging into our container registry.","generate_container_secret":"Generate a container secret","generate_container_secret_description":"Container secret is a credential to launch our Friendli Container images. You should pass the container secret as an environment variable to run the container image.","go_to_secrets_and_create_secret":"Go to Container > Container secrets and click ‘Create secret’","go_to_tokens_and_create_new_token":"Go to Personal settings > Tokens and click ‘Create new token’","login_to_friendli_registry":"Login to Friendli Container registry.","login_with_docker_client":"Login with Docker client","no_description_to_display":"No description to display","no_secrets_to_display":"No secrets to display","no_tags_to_display":"No tags to display","please_store_your_new_secret":"Please store your new secret in a secure place. You cannot see it again.","previously_used":"previously used","public":"Public","pull_image":"Pull image","quickstart":"Quickstart","quickstart_description":"Friendli Container enables you to effortlessly deploy your generative AI model on your machine. 
This quickstart will guide you through the process of running Friendli Container. The current version of Friendli Container supports all major generative AI models, including Llama 3.1, Mixtral, Mistral, Gemma 2, Phi-3.5, Qwen 2.5, and more. Supported models","repository":"Repository","revoke":"Revoke","revoke_now":"Revoke now","revoke_secret":"Revoke secret","rotate":"Rotate","rotate_container_secret_description":"You can rotate the container secret for security reasons. If you rotate the container secret, a new secret will be created and the previous secret will be revoked automatically in 30 minutes.","rotate_secret":"Rotate secret","rotate_secret_disabled_team_role_not_privileged_tooltip":"Rotate secret requires a team role of Admin or higher.","run_container":"Run Friendli Container","save_your_created_token":"Save your created token value.","secret":"Secret","set_friendli_container_secret":"Set the FRIENDLI_CONTAINER_SECRET environment variable.","set_friendli_token":"Set the FRIENDLI_TOKEN environment variable.","single_gpu_hermes_3_llama_3_1_8b":"Running on a single GPU with the Hermes-3-Llama-3.1-8B model.","status":"Status","tags":"Tags","this_action_cannot_be_undone":"This action cannot be undone.\nThe previous secret will be revoked automatically in 30 minutes.","this_will_rotate_current_secret":"This will rotate the current secret with a new secret.\nThe current secret will be revoked automatically in 30 minutes.","updated":"Updated","updated_at":"Updated at","you_may_have_only_one_secret":"You may have only one secret at a time. 
If you want to create a new secret, you should rotate the previous secret with a new secret.\nThe previous secret will become invalid as you rotate it.","your_secret_is_revoked":"Your secret is revoked.","your_secret_is_rotated":"Your secret is rotated."},"dataset":{"adjust_ratio":"Adjust ratio","adjust_ratio_description":"Adjust how the selected splits are divided into training and validation sets.","api_reference":"API reference","assign_splits":"Assign splits","assign_splits_description":"Manually select separate splits for training and validation.","back_to_datasets":"Back to datasets","chat":"Chat","chat_with_image":"Chat with image","chat_with_image_api_reference_description":"Upload for chat with image datasets is available through the SDK only.","created":"Created","dataset":"Dataset","dataset_deleted":"Dataset deleted","dataset_file":"Dataset file","dataset_name":"Dataset name","dataset_name_updated":"Dataset name updated","dataset_split_deleted":"Dataset split deleted","dataset_split_name_updated":"Dataset split name updated","dataset_type":"Dataset type","datasets":"Datasets","delete_dataset_action_cannot_be_undone":"This action cannot be undone. This will permanently delete this dataset.","enter_dataset_name":"Enter dataset name","enter_dataset_name_to_delete_it":"Enter dataset name to delete it","enter_split_name":"Enter split name","example_code":"Example code","failed_to_delete_dataset":"Failed to delete dataset","failed_to_delete_dataset_split":"Failed to delete dataset split","failed_to_get_datasets":"Failed to get datasets","failed_to_load_preview":"Failed to load preview","failed_to_load_preview_description":"We couldn’t generate a preview of your dataset. Please try again in a moment.","failed_to_load_splits":"Failed to load splits","failed_to_load_splits_description":"We couldn’t generate splits of your dataset. 
Please try again in a moment.","failed_to_update_dataset_name":"Failed to update dataset name","failed_to_update_dataset_split_name":"Failed to update dataset split name","find_datasets_by_name":"Find datasets by name","fine_tune":"Fine-tune","new_dataset":"New dataset","no_dataset_searched":"No dataset searched","no_datasets_found_yet":"No datasets found yet.","no_preview_to_show_yet":"No preview to show yet","no_preview_to_show_yet_description":"It might appear once content is uploaded or ready.","no_splits_to_show_yet":"No splits to show yet","no_splits_to_show_yet_description":"Please upload a dataset using the button above.","number_of_rows":"Number of rows","option":"Option","overview":"Overview","please_type_to_confirm_dataset":"Please type ‘{datasetName}’ to confirm","preview":"Preview","previous_step":"Previous step","ratio":"Ratio","read_the_docs":"Read the docs","search_dataset":"Search dataset","select_a_dataset":"Select a dataset","select_a_split":"Select a split","select_splits":"Select splits","select_splits_for_training":"Select splits for training","select_splits_for_validation":"Select splits for validation","selected_dataset":"Selected dataset","set_train_validation_splits":"Set train / validation splits","split":"Split","split_by_ratio":"Split by ratio","split_by_ratio_description":"Divide one or more splits into train/validation using a ratio.","split_id":"Split ID","split_in_use_for_training_tooltip":"This split is in use for training and can’t be selected for validation.","split_in_use_for_validation_tooltip":"This split is in use for validation and can’t be selected for training.","split_name":"Split name","splits":"Splits","splits_are_not_selected":"Splits are not selected","splits_for_training":"Splits for training","splits_for_validation":"Splits for validation","train":"Train","training":"Training","type":"Type","upload_a_file_directly":"Upload a file directly","upload_a_new_dataset":"Upload a new dataset","upload_via_sdk":"Upload via 
SDK","validation":"Validation","view_format_guide":"View format guide"},"dedicated_endpoints":{"4_bit_online_quant_is_not_supported":"4-bit Online Quantization is not supported for the selected model.","4bit":"4BIT","8_bit_online_quant_is_not_supported":"8-bit Online Quantization is not supported for the selected model.","8bit":"8BIT","accelerate_generation_by_predicting_and_validating":"Accelerate generation by predicting\nand validating multiple tokens in parallel.","adapter":"Adapter","adapter_model":"Adapter model","adapter_models":"Adapter models","adapter_name":"Adapter name","adapters":"Adapters","add_count":"Add {count}","add_labels":"Add labels","add_lora_adapter":"Add LoRA adapter","add_lora_adapter_tooltip":"Friendli Dedicated Endpoints support multi-LoRA serving, allowing you to serve pre-trained LLMs with multiple fine-tuned adapters.","add_special_tokens":"Add special tokens","add_special_tokens_tooltip":"Whether or not to add special tokens in tokenization. Equivalent to Hugging Face Tokenizer's `add_special_tokens` argument.","adjusts_n_gram_size_to_balance":"Adjusts n-gram size to balance diversity,\ncache usage, and latency.","all_models":"All models","all_status":"All status","all_status_codes":"All status codes","apply_time_range":"Apply time range","archive":"Archive","archive_model":"Archive model","archive_project":"Archive project","archive_project_disabled_general_project_tooltip":"This project cannot be archived.","archive_project_disabled_team_role_not_privileged_tooltip":"Archiving projects requires a team role of Admin or higher.","archive_this_project_along_with":"Archive this project along with all of its resources.","automatically_scale_the_number_of_replicas":"Automatically scale the number of replicas within the minimum and maximum based on traffic levels. 
Configuring the minimum to 0 leads to a sleeping status.","autoscaling":"Autoscaling","autoscaling_configuration":"Autoscaling configuration","autoscaling_configuration_description":"Handle highly variable traffic while minimizing spend on idle compute resources.","autoscaling_type":"Autoscaling type","autoscaling_type_default_description":"We highly recommend using the Default autoscaling type, as it offers optimal performance for most workloads.","autoscaling_type_queue_description":"Queue delay scaling strategy adjusts worker numbers based on request wait times. With zero workers initially, the first request adds one worker.","autoscaling_type_request_description":"Request count scaling strategy adjusts worker numbers according to total requests in the queue and in progress.\nIt automatically adds workers as the number of requests increases, ensuring tasks are handled efficiently.","awake":"Awake","awake_now":"Awake now","awake_to_update":"Awake to update","awake_to_update_pending_description":"The update has been successfully requested and is currently pending. 
It will proceed once the endpoint is awake.\n\nIf you would like to update immediately, please click the ‘Awake now’ button below.","back_to_endpoint_detail":"Back to endpoint detail","back_to_endpoints":"Back to endpoints","back_to_finetuning":"Back to fine-tuning","back_to_uploaded_models":"Back to uploaded models","backbone":"Backbone","base_model":"Base model","base_model_hugging_face_model_hub":"Base model / Hugging Face model hub","base_model_id":"Base model ID","base_model_uploaded_model":"Base model / Uploaded model","base_model_weights_and_biases_model_artifact":"Base model / Weights & Biases model artifact","batch_size":"Batch size","batch_size_tooltip":"Total batch size used for training","calculator":"Calculate","cancel_job":"Cancel job","cancel_pending_update":"Cancel pending update","cancel_pending_update_description":"Are you sure you want to cancel the update?","cancel_update":"Cancel update","canceled":"Canceled","cannot_access_repo_error":"Please check if the used token is able to access the model repository and update it if necessary.","cannot_change_gpu_type_message":"Cannot change the GPU type.","change":"Change","changes":"changes","chat_data_example":"Chat data example","chat_data_requirements":"Chat data requirements checklist","chat_template_overridden":"Chat template overridden","checking":"Checking...","checking_for_requirements":"Checking for requirements...","click_the_button_to_add_hf_adapters":"Click the button above to add Hugging Face adapters.","clone_of_name":"Clone of {name}","comment":"Comment","comment_updated":"Comment updated","completed":"Completed","configuration":"Configuration","continue_update":"Continue update","cooldown_period":"Cooldown period","cooldown_period_description":"The time delay before scaling down an active replica.","cost_per_million_tokens":"Cost per million tokens","create":"Create","create_a_new_job":"Create a new job","create_an_endpoint":"Create an endpoint","create_an_endpoint_description":"Quickly 
deploy your own model from the Hugging Face repository or the models list.","create_new_endpoint":"Create a new endpoint","create_project":"Create project","created":"Created","created_at":"Created at","current":"current","current_version_will_roll_back_to_version":"Current {baseVersionName} will roll back to {targetVersionName}.","custom_chat_template":"Custom chat template","custom_chat_template_change_file":"Change file","custom_chat_template_choose_file":"Choose file","custom_chat_template_drag_drop_or":"Drag and drop your file here or","custom_chat_template_editor_size_exceeded":"Input size exceeds limit. Please shorten your content to be under 1MB.","custom_chat_template_invalid_content":"Invalid content. Please input a valid Jinja template.","custom_chat_template_not_supported_model":"The selected model does not support chat templates.","custom_chat_template_remove_tooltip":"Remove an overridden chat template","custom_chat_template_tooltip":"Provide a Jinja chat template to override the model's default conversation formatting.","custom_chat_template_upload_file_hint":"Only text files. Max size 1MB.","custom_chat_template_upload_size_exceeded":"File size exceeds limit. Please upload a file under 1MB.","custom_chat_template_view_format_guide":"View format guide","danger_zone":"Danger zone","dataset":"Dataset","dataset_requirements":{"file_upload":"Drag and drop .jsonl file here or click to browse from your computer.","jsonl_format":"You’ll need to have your data in .jsonl file format. Each JSON line consists of a “messages” array of objects.","message_content":"Every messages array must contain at least one message object\n({\"role\": ..., \"content\": ...})."},"dedicated_endpoints":"Dedicated endpoints","default":"Default","delay_time":"Delay time","delete":"Delete","delete_endpoint":"Delete endpoint","delete_endpoint_action_cannot_be_undone":"This action cannot be undone. 
This will permanently delete this endpoint.","delete_error":"Failed to delete","delete_finetuning_action_cannot_be_undone":"This action cannot be undone. This will permanently delete this fine-tuning job.","deploy":"Deploy","development":"Development","disabled":"Disabled","download":"Download","downloading_model":"Downloading model","drag_and_drop_file_here_or_click_to_browse_from_your_computer":"Drag and drop file here or click to browse from your computer.","duplicate":"Duplicate","duplicate_a_job":"Duplicate a job","edit":"Edit","edit_engine_configuration":"Edit engine configuration","editor":"Editor","elapsed_time":"Elapsed time","enabled":"Enabled","endpoint":"Endpoint","endpoint_cancel_update_no_update_to_cancel_error":"The endpoint has no updating version to cancel.","endpoint_cancel_update_processed_beyond_cancellation_error":"The update has progressed beyond the point of cancellation.","endpoint_deleted_success":"Endpoint deleted","endpoint_encountered_an_error":"Endpoint encountered an error","endpoint_features":"Endpoint features","endpoint_health":"Endpoint health","endpoint_id":"Endpoint ID","endpoint_name":"Endpoint name","endpoint_name_mismatch":"Enter endpoint name to delete it","endpoint_name_updated":"Endpoint name updated","endpoint_of_finetuning_name":"Endpoint of {finetuningName}","endpoint_pending_awaking_info_message":"The update has been successfully requested and is currently pending. It will proceed once the endpoint is awake.","endpoint_pending_initializing_info_message":"The update has been successfully requested and is currently pending. 
It will proceed after initializing the endpoint.","endpoint_rollback_already_has_next_version_error":"The endpoint is already rolling out or has a pending next version.","endpoint_rollback_has_insufficient_info_error":"The specified version passed beyond the point of restoration.","endpoint_rollback_initializing_error":"The endpoint is currently initializing, so cannot be updated.","endpoint_rollback_invalid_version_error":"The specified version is not valid for rollback operation.","endpoint_rollback_no_such_version_error":"The specified version does not exist.","endpoint_rollout_already_has_next_version_error":"The endpoint is already rolling out or has a pending next version.","endpoint_rollout_initializing_error":"The endpoint is currently initializing, so cannot be updated.","endpoint_status_awaking":"WAKING UP","endpoint_status_failed":"FAILED","endpoint_status_initializing":"INITIALIZING","endpoint_status_ready":"READY","endpoint_status_running":"RUNNING","endpoint_status_sleeping":"SLEEPING","endpoint_status_stopping":"STOPPING","endpoint_status_terminated":"TERMINATED","endpoint_status_terminating":"TERMINATING","endpoint_status_unknown":"UNKNOWN","endpoint_status_updating":"UPDATING","endpoint_type":"Endpoint type","endpoint_update_cannot_access_repo_error":"Unable to access the repository.","endpoint_update_internal_error":"Internal system error occurred.","endpoint_update_internal_unknown_error":"Unknown internal error occurred.","endpoint_update_invalid_argument_error":"Invalid argument provided.","endpoint_update_invalid_token_error":"Authentication token is invalid or expired.","endpoint_update_memory_error":"Out of memory.","endpoint_updating":"Endpoint updating...","endpoint_url":"Endpoint URL","endpoints":"endpoints","endpoints_tab":"Endpoints","engine_configuration":"Engine configuration","engine_initializing":"Engine initializing","enter_endpoint_name":"Enter endpoint name","enter_finetuning_name":"Enter fine-tuning 
name","enter_hugging_face_adapter_repo_name":"Enter Hugging Face adapter's repository name (ex. FriendliAI/adapter)","enter_model_name":"Enter model name","enter_the_project_name":"Enter the project name","estimated_time_left":"Estimated time left","eval_steps_tooltip":"The number of steps between evaluation of the model using the validation set. If set to 0, there will be no evaluation.","evaluation_steps":"Evaluation steps","failed":"Failed","failed_to_load_adapter_list":"Failed to load adapter list","features":"Features","features_unknown_due_to_custom_template_tooltip":"This information is unavailable because the chat template is overridden for this endpoint, and tool calling and reasoning parser behavior depend on how your custom template operates.","file_does_not_meet_requirements":"File does not meet requirements.","file_type_is_not_supported_only_jsonl_files_allowed":"File type is not supported. Only .jsonl files are allowed.","files":"Files","filter":"Filter","find_endpoints_by":"Find endpoints by name","find_jobs_by":"Find jobs by name","find_uploaded_models_by":"Find uploaded models by name","finetuning":"Fine-tuning","finetuning_deploy_tooltip_message":"Once the output model (adapter) is generated, you can deploy the job.","finetuning_job_deleted_success":"Fine-tuning job deleted","finetuning_job_duplicated":"Fine-tuning job duplicated","finetuning_name_mismatch":"Enter fine-tuning job name to delete it","finetuning_name_updated":"Fine-tuning job name updated","finetuning_phase_cannot_access_repo":"Please check if the used token is able to access the model repository and update it if necessary. You can click 'Duplicate' to start a new job from the previous setting.","finetuning_phase_internal_error":"Please try again later. If the issue keeps happening, contact support.","finetuning_phase_invalid_dataset":"The used dataset format is not currently supported. Please try using a different format. 
You can click 'Duplicate' to start a new job from the previous setting.","finetuning_phase_invalid_model":"The requested model is not currently supported. Please try using a different model. You can click 'Duplicate' to start a new job from the previous setting.","finetuning_phase_invalid_token":"Please check if the used token is valid and update it if necessary. You can click 'Duplicate' to start a new job from the previous setting.","finetuning_phase_memory_error":"CUDA Out-of-Memory Error occurred.","finetuning_status_canceled":"CANCELED","finetuning_status_completed":"COMPLETED","finetuning_status_failed":"FAILED","finetuning_status_initializing":"INITIALIZING","finetuning_status_training":"TRAINING","finetuning_status_unknown":"UNKNOWN","formatted":"Formatted","gated_model":"GATED","general":"General","healthy":"Healthy","hf_model_architecture_not_supported_message":"The architecture is not supported.","hf_model_checking_model_compatibility_message":"Checking model compatibility...","hf_model_dont_have_access_message":"You don't have access to this gated model. Please request approval from the repository.","hf_model_dtype_not_supported_message":"Model dtype not supported.","hf_model_gathering_model_information":"Gathering model information...","hf_model_granted_message":"You have been granted access to this model.","hf_model_granted_with_dtype_casted_message":"You have been granted access to this model. This model will run as bfloat16.","hf_model_hf_api_error_message":"Hugging Face API error.","hf_model_need_approval_message":"You don't have access to this gated model. Please request approval from the repository.","hf_model_need_to_integrate_message":"To access a gated model, you need to integrate with Hugging Face. 
Click the button above to begin the integration.","hf_model_not_found_message":"Model not found.","hf_model_not_supported_message":"Model not supported.","hf_model_quantization_not_supported_message":"Unsupported quantization scheme.","hf_model_repository_is_invalid_message":"The repository is invalid.","hf_model_rope_scaling_not_supported_message":"Unsupported rope scaling type.","hf_model_size_not_supported_message":"Model size not supported.","hf_model_update_your_access_token_message":"Can't access the repository. Please check if the repository exists and is accessible with your Hugging Face access token.","history":"History","hugging_face":"Hugging Face","hugging_face_adapters":"Hugging Face adapters","hugging_face_model":"Hugging Face model","hugging_face_model_hub":"Hugging Face model hub","hugging_face_model_repository_name":"Hugging Face model repository name (e.g. microsoft/phi-4)","hyperparameters":"Hyperparameters","initial_replica":"Initial replica","initial_replica_description":"When the minimum is set to 0, the initial replica is 1; otherwise, it is the same as the minimum.","initializing":"Initializing","initializing_gpu":"Initializing GPU","instance_memory_insufficient_message":"For higher memory instances, please contact us.","instance_type":"Instance type","instance_update_disabled_tooltip":"The instance type cannot be changed once the endpoint has been created.","internal_unknown_error":"Please try again later. If the issue keeps happening, contact support.","invalid_adapter_route_error_message":"Only Latin letters (A-Z, a-z), numbers (0-9), and underscore (_) are allowed.","invalid_argument_error":"The requested model is not currently supported. 
If you have any questions or need further assistance, contact support.","invalid_token_error":"Please check if the used token is valid and update it if necessary.","job_name":"Job name","job_progress":"Job progress","kv_cache_size":"KV cache size","last_deployment":"Last deployment","learn_more":"Learn more","learn_more_in_guide":"Learn more in guide.","learning_rate":"Learning rate","learning_rate_tooltip":"The initial learning rate for AdamW optimizer.","loading":"Loading","log_request_content":"Log request content","log_request_content_tooltip":"If disabled, the contents of inference requests are not logged.","logs":"Logs","lora_alpha":"LoRA alpha","lora_alpha_tooltip":"Scaling factor that determines the influence of the low-rank matrices during fine-tuning.","lora_dropout":"LoRA dropout","lora_dropout_tooltip":"Dropout rate applied during fine-tuning.","lora_r_tooltip":"The rank of the lora parameters","lora_rank":"LoRA rank","low_memory_instance_with_quant_off_warning":"The GPU memory of this instance may be low for the selected model.\nTurn on ‘Online Quantization’ option or change the model.","low_memory_instance_with_quant_off_warning_with_model_change":"The GPU memory of this instance may be low for the selected model.\nChange the model or instance type.","low_memory_tag":"LOW MEMORY","markdown_is_supported":"Markdown is supported","max":"Max","max_file_size_1gb":"Maximum file size: 1 GB","max_file_size_1gb_warning":"Maximum file size for file uploads is 1.0 GB.","max_input_length":"Max input length","max_input_length_tooltip":"Maximum input length to use with the prompt.","max_ngram_size":"Max n-gram size","maximum_batch_size":"Maximum batch size","maximum_batch_size_tooltip":"Maximum number of items that can be processed together. Using default value(=256) is highly recommended.","maximum_n_gram_size":"Maximum n-gram size","members":"Members","memory_error":"The requested model does not fit in the requested GPU. 
Please use a smaller model or increase the number of GPUs.","metrics":"Metrics","min":"Min","min_tokens_disabled_message":"'min_tokens' option is currently disabled when tools are enabled","modalities":"Modalities","mode":"Mode","model":"Model","model_detail":"Model detail","model_does_not_support_vision_dataset_message":"The dataset includes images yet the model does not support vision inputs.","model_has_alternative_model":"We’ve updated some of the model’s metadata to ensure compatibility with our engine. View the changes or use the original model without updates.","model_has_remote_warning":"This repository uses Python files, which may lead to unforeseen issues. We recommend reaching out to us for the best experience.","model_has_remote_warning_and_endpoint_failed":"The model may have failed to function as expected because it relies on Python files which are not downloaded by default for security reasons.\nIf you have any questions, or would like to request a manual review of the model, please contact support.","model_incompatible_with_current_instance_message":"The selected model is incompatible with the current instance. Please choose a different model.","model_max_context_length":"Model max context length","model_max_context_length_tooltip":"Potential performance degradation\ndue to KV cache limits. Learn more","model_name":"Model name","model_repository":"Model repository","model_repository_cannot_be_found":"Model repository cannot be found.","model_revision":"Model revision","multi_lora":"Multi-LoRA","n_gram_spec_decoding":"N-gram speculative decoding","n_gram_spec_decoding_description":"Accelerate generation by predicting and validating multiple tokens in parallel. 
Learn more in guide and blog.","new_endpoint":"New endpoint","new_job":"New job","no_adapter_added":"No adapter added","no_adapter_models_to_display":"No adapter models to display","no_logs_for":"No logs for","no_logs_found":"No logs found yet","no_models_have_been_uploaded_yet":"No models have been uploaded yet.","no_preset_searched":"No preset searched","no_quantity":"No quantity","no_repositories_match_your_search":"No repositories match your search","not_available":"Not available","not_now":"Not now","nothing_to_show":"Nothing to show","num_gpu":"Number of GPUs","num_train_epochs_tooltip":"Total number of training epochs to perform (if not an integer, will perform the decimal part percents of the last epoch before stopping training).","number_of_gpus":"Number of GPUs","number_of_replicas":"Number of replicas","number_of_requests":"Number of requests","number_of_requests_description":"Adds instances when delayed requests exceed the threshold.","number_of_tokens":"Number of tokens","number_of_training_epochs":"Number of training epochs","off":"Off","online_quantization":"Online Quantization","online_quantization_description":"Improves serving efficiency with our proprietary quantization method. 
Learn more in guide and blog.","online_quantization_tooltip":"Improves serving efficiency,\nwith our proprietary quantization method.","optional":"optional","output":"Output","output_models":"Output models","overall_traffic":"Overall traffic","overridden_chat_template":"Overridden chat template","override":"Override","overview":"Overview","parameters":"parameters","parameters_tab":"Parameters","paste_template":"Paste template","paste_your_chat_template":"Paste your chat template","pending":"pending","playground":"Playground","please_accept_the_terms":"Please accept the terms and conditions of the model.","please_check_requirements_and_reupload":"Please check the requirements and re-upload the file.","please_check_the_model_repository":"Please check the model repository name or Hugging Face access token and try again.","please_select_a_model_first":"Please select a model first","please_try_again":"Please try again later.","please_type_model_name":"Please type ‘{modelName}’ to confirm","please_type_to_confirm":"Please type ‘{projectName}’ to confirm","please_type_to_confirm_endpoint":"Please type ‘{endpointName}’ to confirm","please_type_to_confirm_job":"Please type ‘{finetuningName}’ to confirm","preview":"Preview","processed_requests":"Processed requests","processed_tokens":"Processed tokens","production":"Production","project":"Project","project_adapters":"Project adapters","project_has_been_created":"‘{projectName}’ has been created.","project_id":"Project ID","project_name":"Project name","project_name_duplicated_error_message":"A project named ‘{projectName}’ already exists in your team. Try another name.","project_overview":"Project overview","python_interpreter":"Run python code","queue_delay":"Queue delay","queue_delay_description":"Adds instances if a request isn’t processed within the delay time.","reasoning":"Reasoning","reasoning_not_supported_with_tool_call_tooltip":"Our system was not able to detect a common reasoning token. 
Tool calls made during reasoning will be parsed. If you think this is a mistake, please contact us.","reasoning_not_supported_without_tool_call_tooltip":"Our system was not able to detect a common reasoning token. If you think this is a mistake, please contact us.","reasoning_parser":"Reasoning parser","reasoning_parser_tooltip":"When enabled, a separate `reasoning_content` field will include the reasoning process instead of being included in the `content` field. See the response example to learn how the separation works. Notably, the behavior can be overridden by setting the `parse_reasoning` parameter in the request, so this setting only determines the default behavior. Learn more in guide.","reasoning_schema":"Reasoning schema","reasoning_supported_with_tool_call_tooltip":"A common reasoning token was detected. Tool calls made during reasoning will not be parsed.","reasoning_supported_without_tool_call_tooltip":"A common reasoning token was detected.","recently_uploaded":"Recently uploaded","replicas":"Replicas","repository":"Repository","req":"req","request_count":"Request count","request_id":"Request ID","request_latency":"Request latency","request_latency_last_24_hours":"Request latency (last 24 hours)","request_method":"Request method","required":"required","response_example":"Response example","response_time":"Response time","retry":"Retry","revision_select_placeholder":"Select a {variant} first.","rollback":"Rollback","rollback_endpoint":"Rollback endpoint","rollback_endpoint_description":"Are you sure you want to rollback the endpoint configurations? 
This action may revert current settings to previous states.","route":"Route","route_tooltip":"Use this value in your inference request to specify which adapter model should handle your request.","running":"Running","running_out_of":"{curr} running out of {total}","search_by_adapter_name":"Search by adapter name","search_by_model_name":"Search by model name","search_logs":"Search log by request ID or log content","search_preset":"Search preset","search_the_web":"Search the web","search_the_web_linkup":"Search the web (Linkup)","searched_logs_not_return":"Search by full request ID, or try a different request ID or log content.","sec":"sec","seconds":"seconds","select_a_model_to_deploy":"Select a model to deploy","select_dataset":"Select dataset","select_quantization_mode":"Select a quantization mode. Using fewer bits improves performance\nand reduces computational demand with negligible quality impact.\nAvailable GPU options may differ depending on the mode.","select_revision":"Select revision","selected_model_does_not_support_n_gram_spec_decoding_message":"The selected model does not support N-gram speculative decoding","selected_model_does_not_support_online_quantization_message":"The selected model does not support Online Quantization","selected_model_does_not_support_online_quantization_message_with_adapters":"Online Quantization does not support LoRA adapters","show_current_version":"Show current version","skip_special_tokens":"Skip special tokens","skip_special_tokens_tooltip":"Whether or not to remove special tokens in detokenization. Equivalent to Hugging Face Tokenizer's `skip_special_tokens` argument.","sources":"sources","start_endpoint":"Start endpoint","start_with_free_credits":"Start with free credits","support_for_this_model_beta_tooltip":"Support for this model is currently in beta.","switch_revisions":"Switch revisions","temporarily_unavailable_gpu_resources":"GPU resources are temporarily unavailable. 
Please try again soon.","terminate":"Terminate","this_autoscaling_type_is_only_available_for_enterprise_plans":"This autoscaling type is only available for Enterprise plans.","this_endpoint_will_be_terminated":"This endpoint will be terminated immediately so future requests will fail. You can restart this endpoint any time.","this_file_meets_all_the_requirements":"This file meets all the requirements.","this_finetuning_will_be_canceled":"This will cancel this fine-tuning job immediately. You cannot resume this fine-tuning job.","this_instance_does_not_support_online_quantization":"This instance doesn’t support Online Quantization.\nTurn off Online Quantization to use this instance","this_model_is_created_by":"This model is created by","this_route_is_already_in_use":"This route is already in use.","tight_memory_tag":"TIGHT MEMORY","timeline":"Timeline","timestamp":"Timestamp","tokens":"tokens","too_many_files_only_one_file_allowed":"Too many files. Only one file is allowed.","tool_call":"Tool call","tool_call_not_supported_tooltip":"Tool call capabilities may be limited, likely due to the model itself. If this seems incorrect, feel free to contact us.","tool_calling":"Tool calling","tools":"Tools","tools_tab":"Tools","tools_tooltip_description":"Automatically calls the appropriate tools to perform tasks based on your message","total_number_of_requests":"Total number of requests","total_number_of_training":"Total number of training","total_token_usage":"Total token usage","training":"Training","training_steps":"Training steps","training_steps_tooltip":"If set to a positive number, the total number of training steps to perform. 
For a finite dataset, training is reiterated through the dataset (if all data is exhausted) until 'Training steps' is reached.","trending_models":"Trending models","try_out_new_tools":"Try out new tools","unable_to_access_gated":"Unable to access gated model repository.","unable_to_display_content":"Unable to display content","unable_to_display_content_unexpected_error":"We are unable to display content due to an unexpected error.","unable_to_display_file":"Unable to display the file","unable_to_display_file_description":"We are unable to display the file because its size is too large.\nYou can only view files less than {fileSize}.","unable_to_display_logs":"Unable to display logs","unable_to_load_data":"Unable to load data","unformatted":"Unformatted","unhealthy":"Unhealthy","unknown":"UNKNOWN","unknown_error":"Unknown error","unwrap_lines":"Unwrap lines","update":"Update","update_canceled":"Update canceled","update_endpoint_configuration":"Update endpoint configuration","update_endpoint_will_run_using_your_api_key_message":"Upon updating the model, the endpoint will run using your API key instead of the creator's one.","update_endpoint_will_run_using_your_token_message":"Upon updating the model, the endpoint will run using your token instead of the creator's one.","update_engine_configuration":"Update engine configuration","update_failed":"Update failed","upgrade_your_plan_to_unlock_this_feature":"Upgrade your plan to unlock this feature","upload":"Upload","upload_file":"Upload file","uploaded":"uploaded","uploaded_model":"Uploaded model","uploaded_models":"Uploaded models","usage":"Usage","usage_breakdown":"Usage breakdown","version_comment":"Version comment","versions":"Versions","view_all":"View all","view_configs":"View configs","view_less":"View less","view_response_example":"View response example","wake":"Wake","wandb_model_architecture_not_supported_message":"The architecture is not supported.","wandb_model_artifact":"W&B model 
artifact","wandb_model_artifact_is_invalid_message":"The artifact is invalid.","wandb_model_checking_access_permissions_message":"Checking access permissions...","wandb_model_granted_message":"You have been granted access to this model.","wandb_model_need_to_integrate_message":"To access a model, you need to integrate with Wandb. Click the button above to begin the integration.","wandb_model_update_your_api_key_message":"Can't access the artifact. Please check if the artifact exists and is accessible with your Wandb API key.","we_are_unable_to_load":"We are unable to load due to network connectivity issues or errors. Please try again later.","weights_and_biases":"Weights & Biases","weights_and_biases_model_artifact":"Weights & Biases model artifact","weights_and_biases_model_artifact_full_name":"Weights & Biases model artifact full name","weights_and_biases_project":"Weights & Biases project","when_then_model_is_archived":"When the model is archived, it will no longer be visible in the model list.","wrap_lines":"Wrap lines","you_can_only_select_one_adapter":"You can only select one adapter","your_search_filters_not_return":"Your search and filter did not return any results."},"finetuning":{"advanced":"Advanced","basic":"Basic","integrations":"Integrations","wandb_project":"W&B project","weights_and_biases_project":"Weights & Biases project"},"inference":{"reasoning":"Reasoning"},"landing":{"active_endpoints":"Active endpoints","add_team_members":"Add team members","browse_all_models":"Browse all models","browse_models":"Browse models","changed":"changed","contact_team_owner":"Contact team owner","create_a_project":"Create a project","create_an_endpoint":"Create an endpoint","create_endpoint":"Create endpoint","create_one_to_get_started":"Create one to get started.","created":"created","customize_a_model_with_your_own_data":"Customize a model with your own data.","dedicated_endpoint":"Dedicated endpoint","dedicated_endpoints":"Dedicated 
endpoints","endpoints":"Endpoints","explore_models":"Explore models","failed_to_get_endpoints":"Failed to get endpoints","failed_to_get_recent_activities":"Failed to get recent activities","failed_to_get_usage":"Failed to get usage","fine_tune_a_model":"Fine-tune a model","fine_tune_model":"Fine-tune model","fine_tuning":"Fine-tuning","free_credit":"Free credit","get_started_with_friendli_suite":"Get started with Friendli Suite","hide_activities":"Hide activities","hugging_face_integration":"Hugging Face integration","interact_with_your_endpoint_in_real_time":"Interact with your endpoint in real time.","monthly":"monthly","new":"New","no_endpoints_found":"No endpoints found","no_endpoints_found_description":"Create one to get started.","no_models_found":"No models found","no_models_found_description":"There are currently no models available. This might be due to an unexpected error. Please try again later.","no_project_access":"No project access","no_project_searched":"No project searched","no_projects":"No projects","no_recent_activities_found":"No recent activities found.","recent_activities":"Recent activities","restarted":"restarted","search_projects":"Search projects","simply_deploy_a_model_for_api_use":"Simply deploy a model for API use.","terminated":"terminated","test_endpoints_in_playground":"Test endpoints in playground","to_do":"To do","upgrade":"Upgrade","usage":"Usage","view_all_activities":"View all activities","view_details":"View details","view_usage":"View usage","was_awakened":"was awakened","was_changed":"was changed","was_created":"was created","was_restarted":"was restarted","was_terminated":"was terminated","welcome_to_friendli":"Welcome to Friendli"},"layout":{"access_tokens":"Access Tokens","all_teams":"All teams","billing":"Billing","create_project":"Create project","documentation":"Documentation","general":"General","home_page":"Home page","members":"Members","no_teams_found":"No teams found","personal_settings":"Personal 
settings","project":"Project","project_settings":"Project settings","projects":"Projects","setting":"Setting","switch_project":"Switch project","switch_team":"Switch team","team":"Team","team_overview":"Team overview","team_settings":"Team settings","teams":"Teams","this_team_has_no_projects":"This team has no projects."},"serverless_endpoints":{"api":"API","api_identifier":"API identifier","api_usage":"API usage","back_to_serverless_endpoints":"Back to Serverless Endpoints","built_in_tool_call_not_supported_tooltip":"Built-in tools are not available with this endpoint.","built_in_tool_call_supported_tooltip":"Built-in tools (e.g., code interpreter, search) are available with this endpoint in the playground.","built_in_tools":"Built-in tools","cold":"Cold","context_length":"Context length","cooling_down":"Cooling down","endpoint_name":"Endpoint name","failed_to_get_endpoints":"Failed to get endpoints","features":"Features","find_endpoints_by":"Find endpoints by name","frozen":"Frozen","get_friendli_token":"Get Friendli Token","input":"Input","license":"License","linkup_search_tooltip":"For your API/SDK usage, integrate with Linkup here.","modalities":"Modalities","model":{"code_copy":"Copy code","examples":"Examples","markdown":"Markdown","report":"Report"},"model_card":"Model card","model_details":"Model details","model_provider":"Model provider","more_information":"More information","no_serverless_endpoints_found_yet":"No serverless endpoints found yet.","no_serverless_endpoints_searched":"No serverless endpoints searched","output":"Output","overview":"Overview","parameters":"Parameters","price":"Price","price_tooltip":"We offer two pricing models: pinned models are billed per token, while others are charged based on compute time. 
Learn more","pricing":"Pricing","pricing_high_to_low":"Pricing: High to low","pricing_low_to_high":"Pricing: Low to high","reasoning":"Reasoning","reasoning_not_supported_with_tool_call_tooltip":"Our system was not able to detect a common reasoning token. Tool calls made during reasoning will be parsed. If you think this is a mistake, please contact us.","reasoning_not_supported_without_tool_call_tooltip":"Our system was not able to detect a common reasoning token. If you think this is a mistake, please contact us.","reasoning_supported_with_tool_call_tooltip":"A common reasoning token was detected. Tool calls made during reasoning will not be parsed.","reasoning_supported_without_tool_call_tooltip":"A common reasoning token was detected.","search_endpoint_by_model_or_endpoint_name":"Search endpoint by model or endpoint name","serverless_endpoints":"Serverless endpoints","status":"Status","status_tooltip":"Endpoint status shows its readiness: Warm (ready), Warming up, Cooling down, or Cold (inactive).","tool_call":"Tool call","tool_call_not_supported_tooltip":"Tool call capabilities may be limited, likely due to the model itself. 
If this seems incorrect, feel free to contact us.","trending":"Trending","try_in_playground":"Try in playground","unknown":"Unknown","warm":"Warm","warming_up":"Warming up"},"settings":{"account":"Account","achieve_higher_performance_with_dedicated_infrastructure":"Achieve higher performance with dedicated infrastructure","activating_your_plan":"Activating your plan","add_more":"Add more","add_payment_method":"Add payment method","admin":"Admin","admin_description":"Admin-level access to the entire team","all_team_roles":"All team roles","api_tokens":"API tokens","are_you_sure_you_want_to_delete_payment":"Are you sure you want to delete this payment method?","billing":"Billing","billing_overview":"Billing overview","brand":"Brand","build_your_own_models":"Build your own models","cancel":"Cancel","click_the_button_above_to_create_new_token":"Click the button above to create new token.","contact_us":"Contact us","contact_us_at_support_friendli_ai":"Contact us at support@friendli.ai","create":"Create","create_project":"Create project","create_token":"Create token","create_token_info":"Make sure to copy your personal access token now because you will not be able to see this again after refreshing the page.","created_at":"Created at","credit_change":"Credit change","current_password":"Current password","current_tier":"Current tier","current_tier_description":"Your team is currently on the {plan} (Tier {tier}).\nUsage limits will automatically increase upon reaching the next tier within your current plan.","current_tier_max_description":"Your team is currently on the {plan} (Tier {tier}) — the highest tier available in this plan.\nConsider upgrading to a Dedicated Endpoint.","custom":"Custom","date":"Date","default":"Default","default_project":"Default project","default_project_tooltip":"The project that will be used as your default project for access and activity.","default_team":"Default team","default_team_description":"If you belong to multiple teams, this setting 
controls which team is used by default when making requests with the Personal Access Tokens above. Change default team","default_team_tooltip":"The team to which API requests are charged if none is specified. Learn more","delete":"Delete","detail":"Detail","edit":"Edit","email":"Email","email_address":"Email address","ending_in_card_number":"ending in {number}","enter_current_password":"Enter current password","enter_free_credit_code":"Enter free credit code","enter_full_name":"Enter full name","enter_new_password":"Enter new password","enter_team_name":"Enter team name","enter_your_free_credit_code":"Enter your free credit code","error_role_update":"Failed to update team role","expiration_date":"Expiration date","expired_date":"Expired {month}/{year}","expired_on":"Expired on","expires":"Expires","explore_dedicated_endpoints":"Explore Dedicated Endpoints","feature_request_and_feedback":"Feature requests & Feedback","free_coupon_applied":"Free Coupon Applied!","free_coupon_code":"Free coupon code","free_coupon_success_message":"You've received ${creditAmount} free credits for {productName}.","free_credit_code":"Free credit code","friendli_suite_products":"Friendli Suite products","friendli_tokens":"Friendli tokens (Personal access tokens)","friendli_tokens_description":"Your personal access tokens are listed below. It is mainly referred to as a key called FRIENDLI_TOKEN.\nPlease note that we do not display your tokens again after you generate them.","full_name":"Full name","general":"General","got_it":"Got it","handle_higher_volumes_of_inference":"Handle higher volumes of inference","have_questions_please_feel_free_to_contact_us":"Have questions? 
Please feel free to contact us.","increase_your_usage_limits":"Increase your usage limits","integrations":"Integrations","invitations":"Invitations","invite":"Invite","invite_members":"Invite members","last_four_number":"Last 4 number","learn_more":"Learn more","make_default_payment":"Make default payment","make_default_project":"Make default project","make_default_team":"Make default team","manage_the_role_assigned":"Manage the role assigned to {name} ({email}) within the team.","max_token_info":"You cannot create more than {maxCount} tokens.\nPlease delete tokens and try again.","member":"Member","member_description":"Central to the team's operational functionality","members":"Members","members_invited_to_your_team":"{totalCount} members invited to your team","my_projects":"My projects","my_teams":"My teams","name":"Name","name_is_updated":"Name is updated.","need_higher_rate_limits":"Need higher rate limits?","new_password":"New password","next_tier":"Next tier","no_created_date":"No created date","no_default_team_exist":"Default team does not exist","no_expiration":"No expiration","no_members_match_your_search":"No members match your search","no_members_match_your_search_description":"Your search and filter did not return any results.","no_projects":"No projects","no_teams":"No teams","no_tokens_to_display":"No tokens to display","output":"output","owner":"Owner","owner_description":"Owner-level access to the entire team","password":"Password","password_is_updated":"Password is updated.","patents":"Patents","payment_method":"Payment method","pending":"PENDING","personal":"Personal","personal_settings":"Personal settings","policies":"Policies","privacy_policy":"Privacy Policy","profile_image":"Profile image","project_id":"Project ID","project_is_set_to_default_project":"‘{projectName}’ is set to default project.","project_name":"Project name","project_settings":"Project 
settings","projects":"Projects","qualifications":"Qualifications","qualifications_tooltip":"Only applies to usage within Serverless Endpoints plan.","rate_limits_description":"To increase rate limits for your team, you need to add a payment method. Once added, your team’s limits will automatically be increased. Click the button above to add a payment method.","redeem_free_coupon":"Redeem free coupon","remove":"Remove","remove_member":"Remove member","remove_member_description":"Are you sure you want to remove {removeTarget}? This can't be undone.","remove_member_invitation_description":"Are you sure you want to remove {removeTarget} from the invitation? This can't be undone.","resend_invitation":"Resend invitation","reset":"Reset","role":"Role","role_updated":"Team role updated","save":"Save","search_project":"Search project","search_team":"Search team","search_team_members":"Search team members","serve_custom_models":"Serve custom models","service_level_agreement":"Service Level Agreement","settings":"Settings","status":"Status","team":"Team","team_id":"Team ID","team_is_set_to_default_team":"‘{teamName}’ is set to default team.","team_members":"Team members","team_name":"Team name","team_overview":"Team overview","team_profile_image":"Team profile image","team_role":"Team role","team_settings":"Team settings","teams":"Teams","terms_of_service":"Terms of Service","third_party_services":"Third-party services","this_month_estimate":"This month's estimate","this_month_estimate_tooltip":"Your monthly usage from the 1st through the end of each month will be charged on the 5th of the next month.","tier":"Tier","tiers":"Tiers","to_reach_the_next_tier_description":"To reach the next tier, you’ll need to meet the criteria listed in the table below. 
Once the criteria are met, your account will be automatically upgraded.","token":"Token","token_id":"Token ID","token_is_created":"Personal access token is created.","token_is_deleted":"Personal access token is deleted.","token_length":"Token length","tokens":"Tokens","total_historical_spend_of_value":"Total historical spend of ${value}+","update":"Update","usage":"Usage","usage_limits":"Usage limits","valid_payment_method_added":"Valid payment method added","view":"View","view_invoices":"View Invoices","want_to_learn_more_about_rate_limits":"Want to learn more about rate limits?","why_switch_to_dedicated_endpoint":"Why switch to Dedicated Endpoint?","you":"You","you_can_pass_header":"You can pass a header to specify which team is used for an API request. If the team is not specified, your API request will be charged on your default team.","you_have_reached_the_limit_of_your_current_plan":"You’ve Reached the Limit of Your Current Plan","your_profile":"Your profile","your_team_have_not_added_payment_method_yet":"Your team has not added a payment method yet."},"shared":{"account":"Account","add":"Add","additional_settings":"Additional settings","api_key":"API key","archive":"Archive","beta_tag":"BETA","by_user":"by {username}","cancel":"Cancel","change":"Change","clear_chat":"Clear chat","close":"Close","contact_us":"Contact us","copied":"Copied","create":"Create","created":"Created","created_at_datetime":"Created at {datetime}","created_datetime":"Created {datetime}","created_datetime_by_user":"Created {datetime} by {username}","current":"current","datetime_by_user":"{datetime} by {username}","default":"Default","delete":"Delete","deploy":"Deploy","edit":"Edit","end":"End","error":"Error","error_tag":"ERROR","format":"Format","free":"Free","generate":"Generate","got_it":"Got it","gpu":"GPU","hugging_face":"Hugging Face","hugging_face_access_token":"Hugging Face access token","hugging_face_access_token_saved":"Hugging Face access token 
saved","hugging_face_integration":"Hugging Face integration","hugging_face_integration_description":"To connect your Hugging Face account, you need to register your Hugging Face access token. You can generate an access token on Hugging Face at this link.","hugging_face_update_description":"You can generate an access token on Hugging Face at this link.","inference_upload_file_tooltip":"Upload file (.TXT or .PDF, max 10MB)","inference_upload_image_tooltip":"Upload image file (max 10MB)","info":"Info","input":"Input","integrate":"Integrate","integrated_tag":"INTEGRATED","invalid_key_try_again":"Invalid key. Please try again with another key.","invalid_token_try_again":"Invalid token. Please try again with another token.","last_updated":"Last updated","last_updated_datetime_by_user":"Last updated {datetime} by {username}","linkup_api_key":"Linkup API key","linkup_integration_description":"To connect your Linkup account, you need to register your Linkup API key. You can find your Linkup API key at this link.","linkup_integration_has_been_completed":"Linkup integration has been completed","linkup_update_description":"You can find your API keys at this link.","markdown":"Markdown","new":"New","newest":"Newest","not_supported":"Not supported","not_supported_in_this_model":"Not supported in this model.","off":"Off","oldest":"Oldest","on":"On","optional":"optional","output":"Output","please_check_your_connection":"Please check your connection and try again.","prompt":"Prompt","read_docs":"Read docs","reasoning_mode":"Reasoning mode","refresh":"Refresh","reload":"Reload","remove":"Remove","rename":"Rename","reset":"Reset","restart":"Restart","resume_generation":"Resume generation","resume_generation_tooltip":"Enable to continue text generation even after an error occurs during a tool call.","retry":"Retry","save":"Save","settings":"Settings","start":"Start","status":"Status","step":"Step","supported":"Supported","token":"Token","tool_status":"Tool 
status","tool_status_tooltip":"Enable to view real-time tool status updates.","try":"Try","unknown":"Unknown","update":"Update","updated":"Updated {datetime}","updated_at_datetime":"Updated at {datetime}","updated_datetime":"Updated {datetime}","upload":"Upload","use":"Use","user_created_datetime":"{username} created {datetime}","user_updated_datetime":"{username} updated {datetime}","view":"View","view_code":"View code","weights_and_biases":"Weights & Biases","weights_and_biases_api_key":"Weights & Biases API key","weights_and_biases_api_key_saved":"Weights & Biases API key saved","weights_and_biases_integration":"Weights & Biases integration","weights_and_biases_integration_description":"To connect your Weights & Biases account, you need to register your Weights & Biases API key. You can find your API keys at this link.","weights_and_biases_update_description":"You can find your API keys at this link.","you_can_create_pat_here":"You can create a friendli token here.","your_hugging_face_access_token":"Your Hugging Face access token","your_linkup_api_key":"Your Linkup API key","your_weights_and_biases_api_key":"Your Weights & Biases API key"},"solutions":{"finetuning":{"achieve_rapid_model_customization_with_high_quality_results":"Achieve rapid model customization with high-quality results while significantly reducing computational resource requirements.","book_demo":"Book demo","cost_time_and_dataset_efficiency":"Cost, time and dataset efficiency","dedicated_expert_support":"Dedicated expert support","effortlessly_deploy_your_finetuned_models":"Effortlessly deploy your fine-tuned models","experience_fully_handsoff_model_training_service":"Experience a fully hands-off model training service. 
Our AI experts handle everything from\nmodel selection\nand dataset preparation to fine-tuning and deployment, ensuring a seamless process for you.","friendli_suite_not_only_enables":"Friendli Suite not only enables you to easily fine-tune your models but also streamlines the deployment process. You can run your fine-tuned models on autopilot with just a few clicks with Friendli Dedicated Endpoints or meet your privacy and security needs in your own private environment with Friendli Container.","harness_the_power_of_multiple_gpus":"Harness the power of multiple GPUs to speed up the fine-tuning process.","learn_more":"Learn more","leverage_smaller_cost_effective_models":"Leverage smaller, cost-effective models to outperform expensive ones in certain domains.","looking_for_finetuning_experts":"Looking for fine-tuning experts?","need_expert_help":"Need expert help?","optimize_gen_ai_performance":"Optimize generative AI performance by customizing models","optimize_open_source_or_pretrained_custom_models":"Optimize open-source or pre-trained custom models with your enterprise data to specialize in particular domains or tasks.","optimized_multi_gpu_training":"Optimized multi-GPU training","our_team_of_ai_experts_will_work_with_you":"Our team of AI experts will work with you on the entire process of fine-tuning, ensuring that your model is tailored to meet your unique needs efficiently and effectively.","parameter_efficient_finetuning":"Parameter-efficient fine-tuning","seamlessly_deploy_your_finetuned_model":"Seamlessly deploy your fine-tuned model right away in Friendli Dedicated Endpoints","serve_finetuned_model_in_one_click":"Serve a fine-tuned model in one click","serve_your_finetuned_model_within_your_own_private_environment":"Serve your fine-tuned model within your own private environment to meet your privacy and security needs.","start_your_finetuning_project":"Start your fine-tuning project now\nfor your custom 
model","streamline_from_finetuning_to_serving":"Streamline from fine-tuning to serving","this_seamless_process_ensures":"This seamless process ensures high performance and cost-efficiency for your operations.","try_finetuning":"Try fine-tuning","try_now":"Try now","unlock_your_business":"Unlock your business’s potential with fine-tuned models. Use your data to achieve precise,\nindustry-specific outputs, enhancing performance\nwhile saving time and resources.","view_supported_models":"View supported models","why_choose_friendli_finetuning":"Why choose Friendli Fine-Tuning?","why_finetuning":"Why fine-tuning?"},"inference":{"build_and_run_gen_ai_models_on_autopilot":"Build and run generative AI models on autopilot","call_our_fast_and_affordable_api":"Call our fast and affordable API for open-source generative AI models","cost_savings":"Cost savings","deploy_llms_and_more":"Deploy LLMs and more!","even_faster_ttft":"Even faster TTFT with Friendli TCache","fastest_llm_inference_engine_on_market":"The fastest LLM inference engine\non the market","fewer":"Fewer","fine_tune_and_deploy_llms":"Fine-tune and deploy LLMs with H100 GPUs on Friendli Dedicated Endpoints.","friendli_dnn_library_set_of_optimized_gpu_kernels":"Friendli DNN Library is the set of optimized GPU kernels carefully curated and designed specifically for generative AI. Our novel library allows Friendli Inference to support faster LLM inference of various tensor shapes and datatypes, as well as support quantization, Mixture of Experts, LoRA adapters, and so on.","friendli_engine":"Friendli Inference","friendli_engine_is_highly_optimized":"Friendli Inference is highly optimized to make LLM serving fast and cost-effective. Process LLM inference with Friendli Inference, the fastest engine on the market. 
Our performance testing shows that Friendli Inference is significantly faster than vLLM and TensorRT-LLM.","friendli_engine_natively_supports_speculative_decoding":"Friendli Inference natively supports speculative decoding, an optimization technique that rapidly speeds up LLM/LMM inference by making educated guesses on future tokens in parallel while generating the current token. Through validation of the generated potential future tokens, speculative decoding ensures identical model outputs at a fraction of the inference time.","friendli_engine_simultaneously_supports_multiple_lora":"Friendli Inference simultaneously supports multiple LoRA models on fewer GPUs (even on just a single GPU!), a remarkable leap in making LLM customization more accessible and efficient.","friendli_engine_supports_wide_range":"Friendli Inference supports a wide range of generative AI models, including quantized models and MoE.","friendli_tcache_intelligently":"Friendli TCache intelligently identifies and stores frequently used computational results. Friendli Inference leverages the cached results, significantly reducing the workload on the GPUs.","friendli_tcache_reuses_recurring":"Friendli TCache reuses recurring computations, optimizing TTFT (Time to First Token) by leveraging cached results. We show that our Engine delivers 11.3x to 23x faster TTFT compared to vLLM.","get_started":"Get started","gpus_required":"GPUs required","groundbreaking_performance":"GROUNDBREAKING PERFORMANCE","higher":"Higher","highlights":"Highlights","how_to_use":"HOW TO USE","iteration_batching_new_tech":"Iteration batching is a new batching technology we invented to handle concurrent generation requests very efficiently. Iteration batching can achieve up to tens of times higher LLM inference throughput than conventional batching while satisfying the same latency requirement. 
Our technology is protected by our patents in the US, Korea and China.","key_technology":"Key Technology","latency":"Latency","learn_more":"Learn more","lower":"Lower","multi_lora_serving_single_gpu":"Multi-LoRA serving on a single GPU","quantized_llama_on_single_gpu":"Quantized Llama 2 70B on Single GPU","read_docs":"Read the docs","read_more":"Read more","running_quantized_mixtral":"Running Quantized Mixtral 8x7B on a Single GPU","serve_llm_and_lmm_inferences_with_friendli_engine_in_your_gpu_environment":"Serve LLM and LMM inferences with Friendli Inference in your private environment","speed_up_serving_of_llms":"Speed up the serving of LLMs,\nthus slashing costs by","three_ways_to":"Three ways to run generative AI models with Friendli Inference:","throughput":"Throughput","try_for_free":"Try for free","up_to":"up to","view_full_model_list":"View the full model list","we_quantized_mixtral_with_awq":"We quantized the Mixtral-8x7B-instruct v0.1 model with AWQ and ran it on a single NVIDIA A100 80GB GPU. Both the TTFT and TPOT outperform a baseline vLLM system. Friendli Inference achieves at least 4.1x faster response time and 3.8x ~ 23.8x higher token throughput.","what_friendli_engine_offers":"What Friendli Inference offers","with_friendli_engine_running_awqed_models_is_seamless":"With Friendli Inference, running AWQ-ed models is seamless. For example, one can run AWQ-ed LLMs (e.g., Llama 2 70B 4-bit on a single A100 80 GB GPU) natively on Friendli Inference. 
Running LLMs with AWQ on Friendli Inference enables you to achieve efficient LLM deployment and remarkable efficiency gains without sacrificing accuracy."}},"subscription":{"api_features":"API features:\nOpenAI-compatible APIs, long context handling, function calling & JSON mode, gRPC APIs","basic":"Basic","billing":"Billing","built_in_tools_etc":"Built-in tools (Document parsing, web search, code interpreter, etc.)","choose_plan":"Choose plan","configurable_autoscaling":"Configurable autoscaling","contact_owner":"Contact owner","contact_owner_tooltip":"Contact the team owner or admin to get free credits.","contact_sales":"Talk to an engineer","contact_sales_to_increase_limits":"Contact sales to increase limits","contact_us":"Contact us","container":"Container","container_plan_ended_message":"To continue using Friendli Container, please upgrade to the enterprise plan.","container_start_guide_description":"Friendli Container enables secure, efficient AI inference on your own infrastructure with existing GPUs.","container_start_guide_title":"Optimized Generative AI Inference Container","count_days_left":"{count} days left","create_endpoints_directly_from_hugging_face":"Create endpoints directly from Hugging Face","current_plan":"Current plan","custom":"Custom","custom_contract_based_on_gpu_type_usage":"Custom contract based on GPU type and usage","custom_pricing":"Custom pricing","customer_support_during_business_hours":"Customer support during business hours","dedicated_credits_expired":"Your team has used all free credits. To continue using Friendli Dedicated Endpoints, please add a payment method. Then, your team can access our services, and you will only be charged for the usage. 
Details on prices can be found in our pricing page.","dedicated_customer_support":"Dedicated customer support","dedicated_endpoints":"Dedicated endpoints","dedicated_endpoints_start_guide_description":"Friendli Dedicated Endpoints is a one-click GPU platform for AI inference, offering a proprietary high-performance engine and fully managed infrastructure for serving and training custom models on dedicated GPUs.","dedicated_endpoints_start_guide_title":"Inference and Training Acceleration Platform","dedicated_support":"Dedicated support","email_in_app_chat_support":"Email & In-app chat support","enterprise":"Enterprise","environment_support":"Environment support:\nRun in local, cloud, or AWS SageMaker environments","environment_support_air_gapped_production":"Environment support\nRun in air-gapped or production environments","everything_in_basic_plus":"Everything in Basic, plus","everything_in_starter_plus":"Everything in Starter, plus","everything_in_trial_plus":"Everything in Trial, plus","failed_to_get_credits":"Failed to get credits","failed_to_get_plan_information":"Failed to get plan information","fine_tune_custom_models":"Fine-tune custom models","free_trial_credits":"Free trial credits","function_calling_and_json_mode":"Function calling & JSON mode","get_free_credits":"Get free credits","get_started":"Get started","get_started_free":"Get started free","get_started_with":"Get started with","get_value_free_credits":"Get ${value} free credits","long_context_handling":"Long context handling (128K)","metrics_logs":"Metrics & logs","model_serving":"Model serving:\nHugging Face models, quantized models, MoE models, inference optimization","multi_lora_deployments":"Multi-LoRA deployments","on_trial":"On trial","openai_compatible_apis":"OpenAI-compatible APIs","optimized_inference_apis":"Optimized inference APIs","out_of_credits":"Out of credits","pay_as_you_go":"Pay as you go","pricing":"Pricing","priority_access_to_high_demand_gpus":"Priority access to high-demand 
GPUs","rate_limits":"Rate limits","read_the_docs":"Read the docs","remaining":"Remaining","remaining_credits":"Remaining credits","request_trial":"Request trial","serverless_credits_expired":"Your team has used all free credits. To continue using Friendli Serverless Endpoints, please add a payment method and upgrade your plan. Then, your team can access our services with increased rate limits, and you will only be charged for the usage. Details on prices can be found in our pricing page.","serverless_endpoints":"Serverless endpoints","serverless_endpoints_start_guide_description":"Friendli Serverless Endpoints lets you easily run and build generative AI apps using various open-source models.","serverless_endpoints_start_guide_title":"Optimized Model Execution API","start_building_with_friendli_dedicated_endpoints":"Start building with Friendli Dedicated Endpoints.","start_building_with_friendli_serverless_endpoints":"Start building with Friendli Serverless Endpoints.","start_from":"Start from","starter":"Starter","subscribe":"Subscribe","subscription":"Subscription","training_assistance_from_friendliai_experts":"Training assistance from FriendliAI experts","trial":"Trial","try_now":"Try now","unlimited":"Unlimited","upgrade":"Upgrade","upgrade_plan":"Upgrade plan","used":"Used","used_of_total_used":"{usedAmount}of{totalAmount}used","view_plan":"View plan","want_to_learn_more_about_rate_limits":"Want to learn more about rate limits?","with_free_credits":"with free credits","you_have_got_free_credits":"You’ve got free credits!","your_team_is_on_the_plan":"Your team is on the (unknown) plan."}},"now":"$undefined","timeZone":"UTC","children":"$L49"}]

Models

Explore FriendliAI today