branch: elpa/gptel commit 54687edb3d821652ca6e6f87fe472674d322a5e7 Author: Savva Surenkov <savva@surenkov.space> Commit: GitHub <nore...@github.com>
gptel-gemini: add gemini-2.5-flash-lite GA model (#986) gptel-gemini.el (gptel--gemini-models): Also remove duplicate definitions of gemini-2.5-flash-lite-preview-06-17 and gemini-2.5-flash. --- gptel-gemini.el | 49 ++++++++++++++++++++++--------------------------- 1 file changed, 22 insertions(+), 27 deletions(-) diff --git a/gptel-gemini.el b/gptel-gemini.el index e58863b5ac..c5b5e43774 100644 --- a/gptel-gemini.el +++ b/gptel-gemini.el @@ -503,9 +503,9 @@ files in the context." "application/pdf" "text/plain" "text/csv" "text/html" "audio/mpeg" "audio/wav" "audio/ogg" "audio/flac" "audio/aac" "audio/mp3" "video/mp4" "video/mpeg" "video/avi" "video/quicktime" "video/webm") - :context-window 1024 - :input-cost 0.15 - :output-cost 0.60 + :context-window 1048 ; 65536 output token limit + :input-cost 0.3 + :output-cost 2.50 :cutoff-date "2025-01") (gemini-2.5-pro-preview-05-06 :description "Previously most powerful thinking model with state-of-the-art performance" @@ -526,22 +526,29 @@ files in the context." :output-cost 10.00 ; 15 for >200k tokens :cutoff-date "2025-01") (gemini-2.5-flash-lite-preview-06-17 - :description "A Gemini 2.5 Flash model optimized for cost efficiency and low latency" - :capabilities (tool-use json media) - :mime-types ("image/png" "image/jpeg" "image/webp" "image/heic" "image/heif" - "application/pdf" "text/plain" "text/csv" "text/html") - :context-window 1000 ; 64000 output token limit + :description "Fastest and cheapest 2.5 model, for high-volume, latency-sensitive tasks." + :capabilities (tool-use json media audio video) + :mime-types ("image/png" "image/jpeg" "image/webp" "application/pdf" "text/plain" + "audio/x-aac" "audio/flac" "audio/mp3" "audio/m4a" "audio/mpeg" + "audio/mpga" "audio/mp4" "audio/opus" "audio/pcm" "audio/wav" "audio/webm" + "video/x-flv" "video/quicktime" "video/mpeg" "video/mp4" + "video/webm" "video/wmv" "video/3gpp") + :context-window 1048 ; 65536 output token limit :input-cost 0.10 :output-cost 0.40 :cutoff-date "2025-01") - (gemini-2.5-flash - :description "Best model in terms of price-performance, offering well-rounded capabilities." + (gemini-2.5-flash-lite + :description "Fastest and cheapest 2.5 model, for high-volume, latency-sensitive tasks." :capabilities (tool-use json media) - :mime-types ("image/png" "image/jpeg" "image/webp" "image/heic" "image/heif" - "application/pdf" "text/plain" "text/csv" "text/html") - :context-window 1048 ; 65536 output token limit - :input-cost 0.3 - :output-cost 2.50 + :capabilities (tool-use json media audio video) + :mime-types ("image/png" "image/jpeg" "image/webp" "application/pdf" "text/plain" + "audio/x-aac" "audio/flac" "audio/mp3" "audio/m4a" "audio/mpeg" + "audio/mpga" "audio/mp4" "audio/opus" "audio/pcm" "audio/wav" "audio/webm" + "video/x-flv" "video/quicktime" "video/mpeg" "video/mp4" + "video/webm" "video/wmv" "video/3gpp") + :context-window 1048 ; 64000 output token limit + :input-cost 0.10 + :output-cost 0.40 :cutoff-date "2025-01") (gemini-2.5-pro :description "Most powerful Gemini thinking model with state-of-the-art performance" @@ -554,18 +561,6 @@ files in the context." :input-cost 1.25 ; 2.50 for >200k tokens :output-cost 10.00 ; 15 for >200k tokens :cutoff-date "2025-01") - (gemini-2.5-flash-lite-preview-06-17 - :description "Fastest and cheapest 2.5 model, for high-volume, latency-sensitive tasks." - :capabilities (tool-use json media audio video) - :mime-types ("image/png" "image/jpeg" "image/webp" "application/pdf" "text/plain" - "audio/x-aac" "audio/flac" "audio/mp3" "audio/m4a" "audio/mpeg" - "audio/mpga" "audio/mp4" "audio/opus" "audio/pcm" "audio/wav" "audio/webm" - "video/x-flv" "video/quicktime" "video/mpeg" "video/mp4" - "video/webm" "video/wmv" "video/3gpp") - :context-window 1048 - :input-cost 0.075 - :output-cost 0.30 - :cutoff-date "2025-01") (gemini-2.0-flash-thinking-exp :description "DEPRECATED: Please use gemini-2.0-flash-thinking-exp-01-21 instead." :capabilities (tool-use media)