anthropic.php
8 hours ago
chatml.php
1 week ago
core.php
2 days ago
custom.php
1 month ago
factory.php
1 week ago
google-interactions.php
2 days ago
google.php
1 week ago
mistral.php
1 week ago
open-router.php
3 weeks ago
openai.php
3 weeks ago
ovh.php
1 week ago
perplexity.php
6 months ago
replicate.php
5 months ago
xai.php
1 month ago
custom.php
216 lines
| 1 | <?php |
| 2 | |
/**
 * Generic OpenAI-compatible engine. Lets users point AI Engine at any server that speaks the
 * OpenAI Chat Completions API (Ollama, LM Studio, vLLM, llama.cpp, LocalAI, TGI in OAI mode,
 * smaller hosted providers, etc.). Endpoint is user-configurable; API key is optional since
 * many local servers run unauthenticated.
 */
class Meow_MWAI_Engines_Custom extends Meow_MWAI_Engines_ChatML {
  /**
   * Both arguments are handed to the parent constructor unchanged.
   *
   * @param mixed $core Core plugin object (this class later calls get_engine_models() on it).
   * @param mixed $env  Environment settings; this class reads the 'apikey', 'name' and
   *                    'endpoint' keys from it.
   */
  public function __construct( $core, $env ) {
    parent::__construct( $core, $env );
  }

  /**
   * Load the optional API key from the environment settings (null when none is configured).
   */
  protected function set_environment() {
    $this->apiKey = $this->env['apikey'] ?? null;
  }

  /**
   * @return string The user-chosen environment name, or 'Custom' when none is set.
   */
  protected function get_service_name() {
    return ! empty( $this->env['name'] ) ? $this->env['name'] : 'Custom';
  }

  /**
   * Models available for this engine, as reported by the core for the 'custom' engine type.
   * No static list is shipped (see get_models_static()), since the model lineup is whatever
   * the user's server happens to expose. How fetched and manually-added models are combined
   * is decided inside get_engine_models(), not here.
   */
  public function get_models() {
    return $this->core->get_engine_models( 'custom' );
  }

  /**
   * @return array Always empty: there is no built-in model list for custom servers.
   */
  public static function get_models_static() {
    return [];
  }

  /**
   * Map a query to the matching OpenAI-style route under the configured endpoint.
   *
   * @param object      $query    Text/feedback queries go to /chat/completions, embedding
   *                              queries to /embeddings.
   * @param string|null $endpoint Unused here; the base URL always comes from resolve_endpoint().
   * @return string Absolute URL for the request.
   * @throws Exception When the query type is neither text, feedback nor embedding.
   */
  protected function build_url( $query, $endpoint = null ) {
    $base = $this->resolve_endpoint();
    if ( $query instanceof Meow_MWAI_Query_Text || $query instanceof Meow_MWAI_Query_Feedback ) {
      return $base . '/chat/completions';
    }
    if ( $query instanceof Meow_MWAI_Query_Embed ) {
      return $base . '/embeddings';
    }
    throw new Exception( 'Unsupported query type for the Custom (OpenAI-Compatible) provider.' );
  }

  /**
   * Bearer auth is optional here. Most local servers (Ollama default install, LM Studio,
   * llama.cpp server) do not require an API key; hosted OpenAI-compatible endpoints typically
   * do. Only attach the Authorization header when a key is available.
   *
   * @param object $query Query being sent; a non-empty $query->apiKey replaces the key stored
   *                      on this engine instance (and stays in effect for later calls).
   * @return array Header name => value pairs.
   */
  protected function build_headers( $query ) {
    if ( $query->apiKey ) {
      $this->apiKey = $query->apiKey;
    }
    return $this->custom_auth_headers( [
      'Content-Type' => 'application/json',
      'User-Agent' => 'AI Engine',
    ] );
  }

  /**
   * Build the request body via the parent, then rename the token-limit field.
   *
   * @param object        $query          Forwarded to the parent implementation.
   * @param callable|null $streamCallback Forwarded to the parent implementation.
   * @param mixed         $extra          Forwarded to the parent implementation.
   * @return array Request body with 'max_tokens' in place of 'max_completion_tokens'.
   */
  protected function build_body( $query, $streamCallback = null, $extra = null ) {
    $body = parent::build_body( $query, $streamCallback, $extra );

    // Most OAI-compatible servers expect the older max_tokens field, not max_completion_tokens.
    if ( isset( $body['max_completion_tokens'] ) ) {
      $body['max_tokens'] = $body['max_completion_tokens'];
      unset( $body['max_completion_tokens'] );
    }

    return $body;
  }

  /**
   * Resolve the endpoint URL. Defaults to the Ollama localhost URL since that is the most
   * common starting point; users override per-env in settings, and the 'mwai_custom_endpoint'
   * filter gets the final say.
   *
   * Surrounding whitespace and trailing slashes are stripped. If the result is empty (blank
   * setting, or a filter returning an empty/non-string value) the default is used instead, so
   * callers never end up building a relative URL such as "/chat/completions".
   *
   * @return string Base URL without a trailing slash.
   */
  private function resolve_endpoint() {
    $default = 'http://localhost:11434/v1';
    $endpoint = ! empty( $this->env['endpoint'] ) ? $this->env['endpoint'] : $default;
    $endpoint = apply_filters( 'mwai_custom_endpoint', $endpoint, $this->env );
    $endpoint = is_string( $endpoint ) ? rtrim( trim( $endpoint ), '/' ) : '';
    return $endpoint !== '' ? $endpoint : $default;
  }

  /**
   * Add the Bearer Authorization header to $headers when an API key is set.
   *
   * @param array $headers Base headers.
   * @return array The same headers, plus 'Authorization' if a key is available.
   */
  private function custom_auth_headers( array $headers ) {
    if ( ! empty( $this->apiKey ) ) {
      $headers['Authorization'] = 'Bearer ' . $this->apiKey;
    }
    return $headers;
  }

  /**
   * Issue the GET request against a /models URL (shared by retrieve_models() and
   * connection_check() so both use identical headers, timeout and SSL settings).
   *
   * @param string $url Absolute URL of the models listing.
   * @return array|WP_Error Raw result of wp_remote_get().
   */
  private function custom_fetch_models( $url ) {
    return wp_remote_get( $url, [
      'headers' => $this->custom_auth_headers( [ 'User-Agent' => 'AI Engine' ] ),
      'timeout' => 10,
      'sslverify' => MWAI_SSL_VERIFY,
    ] );
  }

  /**
   * Turn the decoded "error" member of a response into a displayable string.
   *
   * @param mixed  $error    Decoded value of the response's "error" key.
   * @param string $fallback Message to use when nothing readable can be extracted.
   * @return string
   */
  private function custom_error_message( $error, $fallback ) {
    if ( is_string( $error ) ) {
      return $error !== '' ? $error : $fallback;
    }
    if ( is_array( $error ) && isset( $error['message'] ) && is_string( $error['message'] ) ) {
      return $error['message'];
    }
    // json_encode() returns false on failure; never surface that as the message.
    $encoded = json_encode( $error );
    return $encoded !== false ? $encoded : $fallback;
  }

  /**
   * Build the failure payload returned by connection_check().
   *
   * @param string $message Error text shown to the user.
   * @param array  $details Diagnostic details (endpoint, HTTP code, ...).
   * @return array
   */
  private function custom_failure( $message, array $details ) {
    return [
      'success' => false,
      'service' => $this->get_service_name(),
      'error' => $message,
      'details' => $details,
    ];
  }

  /**
   * Try to discover models from <endpoint>/models. Servers that don't implement this endpoint
   * (some llama.cpp builds, custom proxies) just yield an empty list — users add models
   * manually through AI Engine's existing custom-models UI.
   *
   * Transport errors and HTTP >= 400 are logged and produce an empty list. Entries without a
   * usable scalar id are skipped instead of aborting the whole listing.
   *
   * @return array List of model definitions (possibly empty).
   */
  public function retrieve_models() {
    $response = $this->custom_fetch_models( $this->resolve_endpoint() . '/models' );

    if ( is_wp_error( $response ) ) {
      Meow_MWAI_Logging::log( 'Custom (OpenAI-Compatible): /models fetch failed: ' . $response->get_error_message() );
      return [];
    }

    $code = wp_remote_retrieve_response_code( $response );
    if ( $code >= 400 ) {
      Meow_MWAI_Logging::log( "Custom (OpenAI-Compatible): /models returned HTTP {$code}." );
      return [];
    }

    $body = json_decode( wp_remote_retrieve_body( $response ), true );
    if ( ! is_array( $body ) || ! isset( $body['data'] ) || ! is_array( $body['data'] ) ) {
      return [];
    }

    $models = [];
    foreach ( $body['data'] as $remote ) {
      if ( ! is_array( $remote ) ) {
        continue;
      }
      $modelId = $remote['id'] ?? '';
      // A malformed id (array/object) would otherwise reach the string functions below and
      // raise a TypeError on PHP 8, losing every model in the response.
      if ( empty( $modelId ) || ! is_scalar( $modelId ) ) {
        continue;
      }
      $modelId = (string) $modelId;

      // The listing carries no capability info, so embedding models are recognised by name.
      $isEmbedding = stripos( $modelId, 'embed' ) !== false;

      $modelData = [
        'model' => $modelId,
        'name' => $modelId,
        'family' => 'custom',
        'features' => $isEmbedding ? [ 'embedding' ] : [ 'completion' ],
        // Pricing is unknown for self-hosted/third-party servers — zero out so usage tracking
        // doesn't invent costs. Users can add per-model pricing through the Custom Models UI.
        'price' => [ 'in' => 0, 'out' => 0 ],
        'type' => 'token',
        'unit' => 1 / 1000000,
        // Use the server-reported limits when present, otherwise fixed defaults.
        'maxCompletionTokens' => isset( $remote['max_output_tokens'] ) ? (int) $remote['max_output_tokens'] : 4096,
        'maxContextualTokens' => isset( $remote['context_window'] ) ? (int) $remote['context_window'] : 8192,
        'tags' => [ 'core', $isEmbedding ? 'embedding' : 'chat' ],
      ];

      if ( $isEmbedding ) {
        $modelData['dimensions'] = isset( $remote['dimensions'] ) ? (int) $remote['dimensions'] : 1536;
      }

      $models[] = $modelData;
    }
    return $models;
  }

  /**
   * Hits <endpoint>/models directly so the user gets a real success/error response. Works
   * without an API key, surfaces real HTTP errors when they happen.
   *
   * Reported as failures: transport errors, HTTP >= 400, a JSON body carrying an "error"
   * member, and a body that does not decode to a JSON object/array (e.g. an HTML page served
   * with HTTP 200, which would otherwise look like a working server with zero models).
   *
   * @return array On success: 'success' => true, 'service', 'message', 'details' (endpoint,
   *               model_count, sample_models). On failure: 'success' => false, 'service',
   *               'error', 'details' (endpoint and, once a response was received, http_code).
   */
  public function connection_check() {
    $url = $this->resolve_endpoint() . '/models';
    $details = [ 'endpoint' => $url ];

    $response = $this->custom_fetch_models( $url );
    if ( is_wp_error( $response ) ) {
      return $this->custom_failure( $response->get_error_message(), $details );
    }

    $code = wp_remote_retrieve_response_code( $response );
    $body = json_decode( wp_remote_retrieve_body( $response ), true );
    $failureDetails = array_merge( $details, [ 'http_code' => $code ] );

    $hasError = is_array( $body ) && isset( $body['error'] );
    if ( $code >= 400 || $hasError ) {
      $fallback = "HTTP {$code} from {$url}.";
      $message = $hasError ? $this->custom_error_message( $body['error'], $fallback ) : $fallback;
      return $this->custom_failure( $message, $failureDetails );
    }

    if ( ! is_array( $body ) ) {
      return $this->custom_failure(
        "Unexpected response from {$url}: the body is not a JSON object (HTTP {$code}).",
        $failureDetails
      );
    }

    // Only count/iterate "data" when it really is a list; count() on anything else throws
    // a TypeError on PHP 8.
    $models = ( isset( $body['data'] ) && is_array( $body['data'] ) ) ? $body['data'] : [];
    $modelCount = count( $models );

    $sampleIds = [];
    foreach ( array_slice( $models, 0, 5 ) as $entry ) {
      if ( isset( $entry['id'] ) ) {
        $sampleIds[] = $entry['id'];
      }
    }

    return [
      'success' => true,
      'service' => $this->get_service_name(),
      'message' => 'Connection successful. Found ' . $modelCount . ' models.',
      'details' => array_merge( $details, [
        'model_count' => $modelCount,
        'sample_models' => $sampleIds,
      ] ),
    ];
  }
}
| 216 |