Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 0 additions & 2 deletions src/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -3,9 +3,7 @@ add_subdirectory(common)
add_subdirectory(handlers)
add_subdirectory(kernels)
add_subdirectory(tokenizer)
add_subdirectory(module)
add_subdirectory(layers)
add_subdirectory(quantization)
add_subdirectory(models)
add_subdirectory(model_loader)
add_subdirectory(model_parallel)
Expand Down
2 changes: 1 addition & 1 deletion src/engine/llm_engine.h
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,8 @@
#include "batch.h"
#include "common/macros.h"
#include "engine.h"
#include "layers/quantization/quant_args.h"
#include "memory/block_manager.h"
#include "quantization/quant_args.h"
#include "tokenizer/tokenizer.h"
#include "tokenizer/tokenizer_args.h"
#include "worker.h"
Expand Down
2 changes: 1 addition & 1 deletion src/engine/worker.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,14 +4,14 @@
#include <torch/torch.h>

#include "common/threadpool.h"
#include "layers/quantization/quant_args.h"
#include "model_loader/state_dict.h"
#include "model_parallel/parallel_args.h"
#include "model_runner.h"
#include "models/causal_lm.h"
#include "models/model_args.h"
#include "models/parameters.h"
#include "parameters.h"
#include "quantization/quant_args.h"

namespace llm {

Expand Down
2 changes: 1 addition & 1 deletion src/engine/worker_test.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,9 @@

#include "engine/batch.h"
#include "engine/utils.h"
#include "layers/quantization/quant_args.h"
#include "memory/block_manager.h"
#include "models/simple_model.h"
#include "quantization/quant_args.h"
namespace llm {

class TestableWorker {
Expand Down
31 changes: 3 additions & 28 deletions src/layers/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -1,32 +1,6 @@
include(cc_library)
include(cc_test)

cc_library(
NAME
linear
HDRS
linear.h
qkv_linear.h
linear_impl.h
fused_linear.h
weight_utils.h
SRCS
linear.cpp
qkv_linear.cpp
linear_impl.cpp
fused_linear.cpp
weight_utils.cpp
DEPS
:state_dict
:model_parallel
:quantization
:kernels
:module
glog::glog
gflags::gflags
torch
)

cc_library(
NAME
pos_embedding
Expand Down Expand Up @@ -73,14 +47,15 @@ cc_test(
activation_test.cpp
pos_embedding_test.cpp
normalization_test.cpp
linear_test.cpp
qkv_linear_test.cpp
DEPS
:layers
:state_dict
absl::random_random
:gtest_main
)

add_subdirectory(module)
add_subdirectory(linear)
add_subdirectory(quantization)
add_subdirectory(attention)
add_subdirectory(moe)
4 changes: 2 additions & 2 deletions src/layers/attention/attention.h
Original file line number Diff line number Diff line change
Expand Up @@ -3,10 +3,10 @@
#include <torch/torch.h>

#include "layers/attention/handler.h"
#include "layers/module/module.h"
#include "layers/module/module_holder.h"
#include "memory/kv_cache.h"
#include "models/parameters.h"
#include "module/module.h"
#include "module/module_holder.h"

namespace llm {

Expand Down
4 changes: 2 additions & 2 deletions src/layers/embedding.h
Original file line number Diff line number Diff line change
Expand Up @@ -5,10 +5,10 @@

#include <cstdint>

#include "layers/module/module.h"
#include "layers/module/module_holder.h"
#include "model_loader/state_dict.h"
#include "model_parallel/model_parallel.h"
#include "module/module.h"
#include "module/module_holder.h"

namespace llm {

Expand Down
102 changes: 0 additions & 102 deletions src/layers/fused_linear.cpp

This file was deleted.

56 changes: 0 additions & 56 deletions src/layers/fused_linear.h

This file was deleted.

80 changes: 0 additions & 80 deletions src/layers/linear.h

This file was deleted.

Loading