AI rule node: add dedicated thread pool for AI requests
This commit is contained in:
parent
db5e4f8d91
commit
ff23fa03c0
@ -30,6 +30,7 @@ import org.springframework.context.annotation.Lazy;
|
||||
import org.springframework.data.redis.core.RedisTemplate;
|
||||
import org.springframework.stereotype.Component;
|
||||
import org.thingsboard.common.util.JacksonUtil;
|
||||
import org.thingsboard.rule.engine.api.AiRequestsExecutor;
|
||||
import org.thingsboard.rule.engine.api.DeviceStateManager;
|
||||
import org.thingsboard.rule.engine.api.MailService;
|
||||
import org.thingsboard.rule.engine.api.MqttClientSettings;
|
||||
@ -319,6 +320,10 @@ public class ActorSystemContext {
|
||||
@Getter
|
||||
private AiSettingsService aiSettingsService;
|
||||
|
||||
@Autowired
|
||||
@Getter
|
||||
private AiRequestsExecutor aiRequestsExecutor;
|
||||
|
||||
@Autowired
|
||||
@Getter
|
||||
private EntityViewService entityViewService;
|
||||
|
||||
@ -23,6 +23,7 @@ import org.bouncycastle.util.Arrays;
|
||||
import org.thingsboard.common.util.DebugModeUtil;
|
||||
import org.thingsboard.common.util.JacksonUtil;
|
||||
import org.thingsboard.common.util.ListeningExecutor;
|
||||
import org.thingsboard.rule.engine.api.AiRequestsExecutor;
|
||||
import org.thingsboard.rule.engine.api.DeviceStateManager;
|
||||
import org.thingsboard.rule.engine.api.MailService;
|
||||
import org.thingsboard.rule.engine.api.MqttClientSettings;
|
||||
@ -1024,6 +1025,11 @@ public class DefaultTbContext implements TbContext {
|
||||
return mainCtx.getAiSettingsService();
|
||||
}
|
||||
|
||||
@Override
|
||||
public AiRequestsExecutor getAiRequestsExecutor() {
|
||||
return mainCtx.getAiRequestsExecutor();
|
||||
}
|
||||
|
||||
@Override
|
||||
public MqttClientSettings getMqttClientSettings() {
|
||||
return mainCtx.getMqttClientSettings();
|
||||
|
||||
@ -0,0 +1,43 @@
|
||||
/**
|
||||
* Copyright © 2016-2025 The Thingsboard Authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
package org.thingsboard.server.service.ai;
|
||||
|
||||
import jakarta.validation.constraints.Min;
|
||||
import jakarta.validation.constraints.NotBlank;
|
||||
import lombok.Data;
|
||||
import org.springframework.boot.context.properties.ConfigurationProperties;
|
||||
import org.springframework.context.annotation.Configuration;
|
||||
import org.springframework.validation.annotation.Validated;
|
||||
|
||||
@Data
|
||||
@Validated
|
||||
@Configuration
|
||||
@ConfigurationProperties(prefix = "actors.rule.ai-requests-thread-pool")
|
||||
class AiRequestsExecutorProperties {
|
||||
|
||||
@NotBlank(message = "Pool name must be not blank")
|
||||
private String poolName = "ai-requests";
|
||||
|
||||
@Min(value = 1, message = "Pool size must be at least 1")
|
||||
private int poolSize = 50;
|
||||
|
||||
@Min(value = 1, message = "Max queue size must be at least 1")
|
||||
private int maxQueueSize = 10000;
|
||||
|
||||
@Min(value = 1, message = "Termination timeout must be at least 1 second")
|
||||
private int terminationTimeoutSeconds = 60;
|
||||
|
||||
}
|
||||
@ -0,0 +1,63 @@
|
||||
/**
|
||||
* Copyright © 2016-2025 The Thingsboard Authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
package org.thingsboard.server.service.ai;
|
||||
|
||||
import com.google.common.util.concurrent.FluentFuture;
|
||||
import com.google.common.util.concurrent.ListeningExecutorService;
|
||||
import com.google.common.util.concurrent.MoreExecutors;
|
||||
import dev.langchain4j.model.chat.ChatModel;
|
||||
import dev.langchain4j.model.chat.request.ChatRequest;
|
||||
import dev.langchain4j.model.chat.response.ChatResponse;
|
||||
import jakarta.annotation.PostConstruct;
|
||||
import jakarta.annotation.PreDestroy;
|
||||
import lombok.RequiredArgsConstructor;
|
||||
import org.springframework.context.annotation.Lazy;
|
||||
import org.springframework.stereotype.Component;
|
||||
import org.thingsboard.common.util.ThingsBoardExecutors;
|
||||
import org.thingsboard.rule.engine.api.AiRequestsExecutor;
|
||||
|
||||
import java.time.Duration;
|
||||
|
||||
@Lazy
|
||||
@Component
|
||||
@RequiredArgsConstructor
|
||||
class DefaultAiRequestsExecutor implements AiRequestsExecutor {
|
||||
|
||||
private final AiRequestsExecutorProperties properties;
|
||||
|
||||
private ListeningExecutorService executorService;
|
||||
|
||||
@PostConstruct
|
||||
private void init() {
|
||||
executorService = MoreExecutors.listeningDecorator(
|
||||
ThingsBoardExecutors.newLimitedTasksExecutor(properties.getPoolSize(), properties.getMaxQueueSize(), properties.getPoolName())
|
||||
);
|
||||
}
|
||||
|
||||
@Override
|
||||
public FluentFuture<ChatResponse> sendChatRequestAsync(ChatModel chatModel, ChatRequest chatRequest) {
|
||||
return FluentFuture.from(executorService.submit(() -> chatModel.chat(chatRequest)));
|
||||
}
|
||||
|
||||
@PreDestroy
|
||||
private void destroy() {
|
||||
if (executorService != null) {
|
||||
MoreExecutors.shutdownAndAwaitTermination(executorService, Duration.ofSeconds(properties.getTerminationTimeoutSeconds()));
|
||||
executorService = null;
|
||||
}
|
||||
}
|
||||
|
||||
}
|
||||
@ -463,6 +463,16 @@ actors:
|
||||
allow_system_sms_service: "${ACTORS_RULE_ALLOW_SYSTEM_SMS_SERVICE:true}"
|
||||
# Specify thread pool size for external call service
|
||||
external_call_thread_pool_size: "${ACTORS_RULE_EXTERNAL_CALL_THREAD_POOL_SIZE:50}"
|
||||
# Configuration for the thread pool that executes HTTP calls to AI provider APIs
|
||||
ai-requests-thread-pool:
|
||||
# The base name for threads
|
||||
pool-name: "${ACTORS_RULE_AI_REQUESTS_THREAD_POOL_NAME:ai-requests}"
|
||||
# The maximum number of concurrent HTTP requests
|
||||
pool-size: "${ACTORS_RULE_AI_REQUESTS_THREAD_POOL_SIZE:50}"
|
||||
# The maximum queue size for pending AI requests
|
||||
max-queue-size: "${ACTORS_RULE_AI_REQUESTS_THREAD_POOL_QUEUE_SIZE:10000}"
|
||||
# The maximum time in seconds to wait for active tasks to complete during graceful shutdown
|
||||
termination-timeout-seconds: "${ACTORS_RULE_AI_REQUESTS_THREAD_POOL_TERMINATION_TIMEOUT_SECONDS:60}"
|
||||
chain:
|
||||
# Errors for particular actors are persisted once per specified amount of milliseconds
|
||||
error_persist_frequency: "${ACTORS_RULE_CHAIN_ERROR_FREQUENCY:3000}"
|
||||
|
||||
@ -0,0 +1,27 @@
|
||||
/**
|
||||
* Copyright © 2016-2025 The Thingsboard Authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
package org.thingsboard.rule.engine.api;
|
||||
|
||||
import com.google.common.util.concurrent.FluentFuture;
|
||||
import dev.langchain4j.model.chat.ChatModel;
|
||||
import dev.langchain4j.model.chat.request.ChatRequest;
|
||||
import dev.langchain4j.model.chat.response.ChatResponse;
|
||||
|
||||
public interface AiRequestsExecutor {
|
||||
|
||||
FluentFuture<ChatResponse> sendChatRequestAsync(ChatModel chatModel, ChatRequest chatRequest);
|
||||
|
||||
}
|
||||
@ -422,6 +422,8 @@ public interface TbContext {
|
||||
|
||||
AiSettingsService getAiSettingsService();
|
||||
|
||||
AiRequestsExecutor getAiRequestsExecutor();
|
||||
|
||||
// Configuration parameters for the MQTT client that is used in the MQTT node and Azure IoT hub node
|
||||
|
||||
MqttClientSettings getMqttClientSettings();
|
||||
|
||||
@ -26,6 +26,7 @@ import dev.langchain4j.model.chat.request.ChatRequest;
|
||||
import dev.langchain4j.model.chat.request.ResponseFormat;
|
||||
import dev.langchain4j.model.chat.request.ResponseFormatType;
|
||||
import dev.langchain4j.model.chat.request.json.JsonSchema;
|
||||
import dev.langchain4j.model.chat.response.ChatResponse;
|
||||
import dev.langchain4j.model.input.PromptTemplate;
|
||||
import org.checkerframework.checker.nullness.qual.NonNull;
|
||||
import org.thingsboard.common.util.JacksonUtil;
|
||||
@ -130,10 +131,11 @@ public final class TbAiNode extends TbAbstractExternalNode implements TbNode {
|
||||
.build();
|
||||
|
||||
configureChatModelAsync(ctx)
|
||||
.transform(chatModel -> sendChatRequest(chatModel, chatRequest), ctx.getExternalCallExecutor())
|
||||
.transformAsync(chatModel -> ctx.getAiRequestsExecutor().sendChatRequestAsync(chatModel, chatRequest), directExecutor())
|
||||
.addCallback(new FutureCallback<>() {
|
||||
@Override
|
||||
public void onSuccess(String response) {
|
||||
public void onSuccess(ChatResponse chatResponse) {
|
||||
String response = chatResponse.aiMessage().text();
|
||||
if (!isValidJsonObject(response)) {
|
||||
response = wrapInJsonObject(response);
|
||||
}
|
||||
@ -165,10 +167,6 @@ public final class TbAiNode extends TbAbstractExternalNode implements TbNode {
|
||||
}, ctx.getDbCallbackExecutor());
|
||||
}
|
||||
|
||||
private String sendChatRequest(ChatModel chatModel, ChatRequest chatRequest) {
|
||||
return chatModel.chat(chatRequest).aiMessage().text();
|
||||
}
|
||||
|
||||
private static boolean isValidJsonObject(String jsonString) {
|
||||
try {
|
||||
JsonNode result = JacksonUtil.toJsonNode(jsonString);
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user