下载
中文
注册

简介

数据类型LLVMReq定义在“${install_path}/latest/runtime/include/ge/llm_engine_types.h”。其中${install_path}为runtime安装路径,root用户的默认路径是“/usr/local/Ascend”。具体信息如下。

class LLMReq {
 public:
  LLMReq() = default;
  ~LLMReq() = default;
  //设置请求的id,不同请求的id不能重复
  void SetReqId(const uint64_t req_id) {
    req_id_ = req_id;
  }
  //获取请求id
  uint64_t GetReqId() const {
    return req_id_;
  }
  //设置全量kv的长度,当前暂没用到
  void SetPromptLength(const uint64_t prompt_length) {
    prompt_length_ = prompt_length;
  }
  //获取kv长度
  uint64_t GetPromptLength() const {
    return prompt_length_;
  }
 //设置请求所在的全量集群id
  void SetPromptClusterId(const uint64_t prompt_cluster_id) {
    prompt_cluster_id_ = prompt_cluster_id;
  }
 //获取请求所在的全量集群id
  uint64_t GetPromptClusterId() const {
    return prompt_cluster_id_;
  }
  //设置请求所在的增量集群id
  void SetDecoderClusterId(const uint64_t decoder_cluster_id) {
    decoder_cluster_id_ = decoder_cluster_id;
  }
  //获取请求所在的增量集群id
  uint64_t GetDecoderClusterId() const {
    return decoder_cluster_id_;
  }
  //预加载公共前缀
  void SetPrefixId(const uint64_t prefix_id) {
    prefix_id_ = prefix_id;
  }
  //释放公共前缀
  uint64_t GetPrefixId() const {
    return prefix_id_;
  }

  void SetSequenceLen(const uint64_t sequence_length) {
    sequence_length_ = sequence_length;
  }

  uint64_t GetSequenceLen() const {
    return sequence_length_;
  }

 private:
  uint64_t req_id_{0UL};
  // 请求prompt的句子长度,做完padding的值, 用于申请prompt的KVCache
  uint64_t prompt_length_{0UL};
  uint64_t prompt_cluster_id_{0UL};  // in/out, runPrompt的输出, runecoder的输入
  uint64_t decoder_cluster_id_{0UL};
  uint64_t prefix_id_{kInvalidPrefixId};
  int8_t reserved_[128];
};