Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
77 commits
Select commit Hold shift + click to select a range
c0bf108
test_utils refactor, local_cpu_allocator
dylanllim Jul 11, 2024
47ad0d8
test utils modification, cast, reverse, and replicate cpu kernels
dylanllim Jul 12, 2024
921fe65
combine kernel
dylanllim Jul 14, 2024
4ca67aa
combine kernels .h file
dylanllim Jul 14, 2024
86edf2e
Implementations for methods for machine_views and associated modules …
Marsella8 Jul 19, 2024
d9af610
test utils logic cleanup, reverse cpu_kernel pedagogical implementatio…
dylanllim Jul 31, 2024
64034a5
cpu_kernel's refactor, generic tensor accessor indexing
dylanllim Oct 8, 2024
0304f17
accessor.h formatting
dylanllim Oct 8, 2024
7c3ff87
mk_runtime_error formatting
dylanllim Oct 8, 2024
65d7804
reverse_kernels include
dylanllim Oct 8, 2024
7c5fb1f
test_utils refactor and clarity
dylanllim Oct 15, 2024
8188afe
formatting
dylanllim Oct 15, 2024
a13255b
comment removal reverse_kernels
dylanllim Oct 15, 2024
7ed5624
Issue #1435, tests for managed stream and handle
dylanllim Oct 16, 2024
c1758c0
#1435 formatting
dylanllim Oct 16, 2024
54b3888
#1409 issue, change datatype for linear kernels away from void *
dylanllim Oct 16, 2024
5b5c2f6
R & W accessor changes, minimize code bloat
dylanllim Nov 5, 2024
ddae367
code formatting and refactor
dylanllim Nov 16, 2024
507df4a
issue #1502 & issue #1540
dylanllim Nov 22, 2024
c64a55c
format check
dylanllim Nov 22, 2024
a091652
branch merge and test fixes
dylanllim Jan 28, 2025
f19df3a
Merge remote-tracking branch 'origin/master' into cpu-kernels-tests-v2
dylanllim Jan 29, 2025
8860adf
build issues
dylanllim Jan 29, 2025
7b74acc
Add AWS linux AMI to runs-on for testing (#1589)
lockshaw Jan 30, 2025
8cdc677
Pin runs-on images (#1590)
lockshaw Jan 30, 2025
209db7e
GPU CI Fix (Pin runs-on GPU image) (#1588)
lockshaw Jan 31, 2025
0d2ffdb
Merge substitution-builder (#1575)
victorli2002 Feb 1, 2025
fe339eb
test_utils refactor, local_cpu_allocator
dylanllim Jul 11, 2024
2e2ae13
test utils modification, cast, reverse, and replicate cpu kernels
dylanllim Jul 12, 2024
6c30466
combine kernel
dylanllim Jul 14, 2024
5b5c591
test utils logic cleanup, reverse cpu_kernel pedagogical implementatio…
dylanllim Jul 31, 2024
f0432c3
cpu_kernel's refactor, generic tensor accessor indexing
dylanllim Oct 8, 2024
74d186d
test_utils refactor and clarity
dylanllim Oct 15, 2024
f95d9da
R & W accessor changes, minimize code bloat
dylanllim Nov 5, 2024
8c8bc75
issue #1502 & issue #1540
dylanllim Nov 22, 2024
c00ab84
branch merge and test fixes
dylanllim Jan 28, 2025
bc4b659
merge
dylanllim Feb 5, 2025
3146712
Merge remote-tracking branch 'origin/master' into cpu-kernels-tests
dylanllim Feb 5, 2025
e71b6d7
build after merge
dylanllim Feb 5, 2025
311caf8
kernel issues
dylanllim Feb 8, 2025
157407d
managed stream / handle test case fix
dylanllim Feb 10, 2025
338fc8d
Merge remote-tracking branch 'origin/master' into cpu-kernels-tests
dylanllim Feb 10, 2025
35e43c6
test_utils update, kernel/ops refactor
dylanllim Feb 25, 2025
e5c607b
Merge remote-tracking branch 'origin/master' into dylan-cpu-kernels
lockshaw Mar 11, 2025
a07ed6c
Review fixes
lockshaw Mar 13, 2025
60cac9e
Update doctest includes in kernels
lockshaw Mar 17, 2025
0cff9b6
Merge remote-tracking branch 'origin/master' into dylan-cpu-kernels
lockshaw Mar 17, 2025
487773d
More PR review
lockshaw Mar 20, 2025
48b0096
Try using rhel package-based nixgl
lockshaw Mar 20, 2025
167485b
Format
lockshaw Mar 20, 2025
42efe35
Update proj with test command fixes
lockshaw Mar 21, 2025
8794542
Attempt to fix gpu CI
lockshaw Mar 21, 2025
72b9c6b
Use custom AMI in GPU CI
lockshaw Apr 22, 2025
af2fad1
Merge branch 'master' into cpu-kernels-tests
lockshaw Apr 22, 2025
4585912
Fix proj bug in cpu-ci
lockshaw Apr 22, 2025
4a1abc8
Try including run id
lockshaw Apr 22, 2025
4ea8c99
Temporarily allow gpu ci to run regardless for testing purposes
lockshaw Apr 22, 2025
692dde7
Merge remote-tracking branch 'origin/master' into dylan-cpu-kernels
lockshaw Apr 22, 2025
176b6d2
Try using official ubuntu ami in gpu ci
lockshaw Apr 22, 2025
68e7a48
Merge remote-tracking branch 'origin/master' into dylan-cpu-kernels
lockshaw Apr 23, 2025
11128cd
Try out new ami
lockshaw Apr 23, 2025
3982c87
Merge remote-tracking branch 'origin/master' into dylan-cpu-kernels
lockshaw Apr 23, 2025
07f3e27
Change to use new flexflow-gpu-ci AMI
lockshaw Apr 23, 2025
bb5e715
Fix bugs in GPU tests and restore GPU CI gating
lockshaw Apr 24, 2025
2a7afb2
Format
lockshaw Apr 24, 2025
56fc98c
Fix bug in accessor formatting test cases
lockshaw Apr 24, 2025
ce7cf83
Bugfixes and updated proj
lockshaw May 1, 2025
3fe8071
Merge remote-tracking branch 'origin/master' into dylan-cpu-kernels
lockshaw May 1, 2025
469f0a8
Fix all cpu tests
lockshaw May 2, 2025
c2a9712
Format
lockshaw May 2, 2025
e8b00cb
Add improved test failure output for replicate cpu vs gpu tests
lockshaw May 2, 2025
2886d0c
Continue debugging replicate cuda testcases
lockshaw May 2, 2025
7944e8c
Format
lockshaw May 2, 2025
de7d82c
Fix incorrect tensor size in replicate kernel tests
lockshaw May 2, 2025
252ae2d
Transpose replicate backward cpu kernel
lockshaw May 2, 2025
4fb76fe
Try flipping output dimensions in replica cuda kernel test
lockshaw May 2, 2025
69bc332
Update proj
lockshaw May 2, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
54 changes: 54 additions & 0 deletions .flake/pkgs/fccf/default.nix
Original file line number Diff line number Diff line change
@@ -0,0 +1,54 @@
# Nix package for fccf (https://github.com/p-ranav/fccf), built with CMake
# from a pinned upstream commit.
{ lib
, stdenv
, fetchFromGitHub
, cmake
, pkg-config
, libclang
, libllvm
, zlib
, argparse
, nlohmann_json
, fmt
}:

let
  # Upstream commit to build; used both as the fetch revision and as the
  # package version string.
  pinnedCommit = "03d373fc65e2d7ceeac441ba4bbddfdc25618dff";
in
stdenv.mkDerivation {
  pname = "fccf";
  version = pinnedCommit;

  src = fetchFromGitHub {
    owner = "p-ranav";
    repo = "fccf";
    rev = pinnedCommit;
    sha256 = "sha256-3NdPon5ZfjoGFFgBlb0rzRnfWgSopvAc5Gls2NWHaOE=";
  };

  # Local patches applied on top of the upstream sources:
  #   - json-package-name.patch: adds `FIND_PACKAGE_ARGS NAMES nlohmann_json`
  #     to the FetchContent declaration of `json` in CMakeLists.txt.
  #   - fix-argparse-include.patch: switches source/main.cpp to include
  #     <argparse/argparse.hpp> instead of <argparse.hpp>.
  patches = [
    ./json-package-name.patch
    ./fix-argparse-include.patch
  ];

  # Tools needed at build time.
  nativeBuildInputs = [
    cmake
    pkg-config
  ];

  # Libraries fccf is built against.
  buildInputs = [
    libclang
    libllvm
    zlib
    argparse
    nlohmann_json
    fmt
  ];

  cmakeFlags = [
    "-DCMAKE_BUILD_TYPE=Release"
    # NOTE(review): presumably set so that FetchContent resolves its
    # dependencies via find_package (i.e. from buildInputs) rather than
    # downloading them -- confirm against the CMake FetchContent docs.
    "-DFETCHCONTENT_TRY_FIND_PACKAGE_MODE=ALWAYS"
  ];

  meta = {
    description = "A command-line tool that quickly searches through C/C++ source code in a directory based on a search string and prints relevant code snippets that match the query";
    homepage = "https://github.com/p-ranav/fccf";
    license = lib.licenses.mit;
  };
}
13 changes: 13 additions & 0 deletions .flake/pkgs/fccf/fix-argparse-include.patch
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
diff --git a/source/main.cpp b/source/main.cpp
index 7e131d3..6c05d89 100644
--- a/source/main.cpp
+++ b/source/main.cpp
@@ -6,7 +6,7 @@
#include <string_view>
#include <vector>

-#include <argparse.hpp>
+#include <argparse/argparse.hpp>
#include <nlohmann/json.hpp>
#include "searcher.hpp"
#include <unistd.h>
12 changes: 12 additions & 0 deletions .flake/pkgs/fccf/json-package-name.patch
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 20bcbbf..923075f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -48,6 +48,7 @@ FetchContent_MakeAvailable(fmt)

FetchContent_Declare(json
URL https://github.com/nlohmann/json/releases/download/v3.10.5/json.tar.xz
+ FIND_PACKAGE_ARGS NAMES nlohmann_json
)
FetchContent_MakeAvailable(json)

19 changes: 0 additions & 19 deletions .github/runs-on.yml
Original file line number Diff line number Diff line change
@@ -1,23 +1,4 @@
images:
runs-on-gpu-pinned:
platform: "linux"
arch: "x64"
owner: "135269210855" # runs-on
# to find, go to
# https://us-east-2.console.aws.amazon.com/ec2/home?region=us-east-2#Images:visibility=public-images;search=:runs-on;v=3;$case=tags:false%5C,client:false;$regex=tags:false%5C,client:false
name: "runs-on-v2.2-ubuntu22-gpu-x64-20250220122045"

runs-on-cpu-pinned:
platform: "linux"
arch: "x64"
owner: "135269210855" # runs-on
name: "runs-on-v2.2-ubuntu22-full-x64-20250220122045"

official-ubuntu-ami:
platform: "linux"
arch: "x64"
ami: "ami-0a60b027285c0d4c5"

flexflow-gpu-ci:
platform: "linux"
arch: "x64"
Expand Down
4 changes: 2 additions & 2 deletions .github/workflows/tests.yml
Original file line number Diff line number Diff line change
Expand Up @@ -57,9 +57,9 @@ jobs:
name: GPU unit tests
needs: cpu-ci
runs-on:
- runs-on
- runs-on=${{ github.run_id }}
- family=g4dn.xlarge
- image=runs-on-gpu-pinned
- image=flexflow-gpu-ci

strategy:
max-parallel: 1
Expand Down
60 changes: 42 additions & 18 deletions .proj.toml
Original file line number Diff line number Diff line change
Expand Up @@ -2,57 +2,81 @@ project_name = "flexflow"
testsuite_macro = "FF_TEST_SUITE"
namespace_name = "FlexFlow"
header_extension = ".h"
cuda_launch_cmd = [
"nixGL",
"--",
]

[targets.utils]
type = "lib"
tests = true
benchmarks = true
has-cpu-only-tests = true
has-cpu-only-benchmarks = true
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.op-attrs]
type = "lib"
tests = true
benchmarks = false
has-cpu-only-tests = true
has-cpu-only-benchmarks = false
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.kernels]
type = "lib"
tests = true
benchmarks = false
has-cpu-only-tests = true
has-cpu-only-benchmarks = false
has-cuda-tests = true
has-cuda-benchmarks = false

[targets.pcg]
type = "lib"
tests = true
benchmarks = false
has-cpu-only-tests = true
has-cpu-only-benchmarks = false
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.substitutions]
type = "lib"
tests = true
benchmarks = false
has-cpu-only-tests = true
has-cpu-only-benchmarks = false
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.compiler]
type = "lib"
tests = true
benchmarks = true
has-cpu-only-tests = true
has-cpu-only-benchmarks = true
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.substitution-generator]
type = "lib"
tests = true
benchmarks = false
has-cpu-only-tests = true
has-cpu-only-benchmarks = false
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.local-execution]
type = "lib"
tests = true
benchmarks = false
has-cpu-only-tests = true
has-cpu-only-benchmarks = false
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.models]
type = "lib"
tests = true
benchmarks = false
has-cpu-only-tests = true
has-cpu-only-benchmarks = false
has-cuda-tests = false
has-cuda-benchmarks = false

[targets.export-model-arch]
type = "bin"
cuda = false

[targets.substitution-to-dot]
type = "bin"
cuda = false

# default_build_targets = [
# "utils",
Expand Down
7 changes: 6 additions & 1 deletion cmake/flexflow-utils.cmake
Original file line number Diff line number Diff line change
Expand Up @@ -126,11 +126,16 @@ function(ff_add_test_executable)
${FF_TEST_EXEC_NAME}
${SRC})

target_include_directories(
${FF_TEST_EXEC_NAME}
PRIVATE
${FF_TEST_EXEC_PRIVATE_INCLUDE})

target_link_libraries(
${FF_TEST_EXEC_NAME}
${FF_TEST_EXEC_DEPS})

target_compile_definitions(${FF_TEST_EXEC_NAME} PRIVATE FF_TEST_SUITE="${FF_TEST_EXEC_NAME}" FF_CUDA_TEST_SUITE="cuda-${FF_TEST_EXEC_NAME}")
target_compile_definitions(${FF_TEST_EXEC_NAME} PRIVATE FF_TEST_SUITE="cpu-${FF_TEST_EXEC_NAME}" FF_CUDA_TEST_SUITE="cuda-${FF_TEST_EXEC_NAME}")

define_ff_vars(${FF_TEST_EXEC_NAME})
ff_set_cxx_properties(${FF_TEST_EXEC_NAME})
Expand Down
6 changes: 3 additions & 3 deletions flake.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

3 changes: 3 additions & 0 deletions flake.nix
Original file line number Diff line number Diff line change
Expand Up @@ -59,6 +59,7 @@
bencher-cli = pkgs.callPackage ./.flake/pkgs/bencher-cli.nix { };
ffdb = pkgs.callPackage ./.flake/pkgs/ffdb { inherit proj; };
hpp2plantuml = pkgs.python3Packages.callPackage ./.flake/pkgs/hpp2plantuml.nix { };
fccf = pkgs.callPackage ./.flake/pkgs/fccf { };
rapidcheckFull = pkgs.symlinkJoin {
name = "rapidcheckFull";
paths = (with pkgs; [ rapidcheck.out rapidcheck.dev ]);
Expand Down Expand Up @@ -162,6 +163,7 @@
ruff
jq
gh
expect
])
(with pkgs.python3Packages; [
gitpython
Expand All @@ -179,6 +181,7 @@
(with self.packages.${system}; [
ffdb
hpp2plantuml
fccf
])
];
};
Expand Down
4 changes: 2 additions & 2 deletions lib/kernels/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,7 @@ file(GLOB_RECURSE SRC
CONFIGURE_DEPENDS
LIST_DIRECTORIES False
src/*.cc
src/cuda/cuda_helper.cu
src/cuda/ops/*.cu
src/cuda/*.cu
)

add_library(
Expand All @@ -30,6 +29,7 @@ target_link_libraries(
cudnn
nccl
utils
pcg
)

define_ff_vars(${project_target})
Expand Down
Loading
Loading