April 8, 2025 11:41 · April 8, 2025 08:39 · April 8, 2025 08:37 · April 2, 2025 11:38 · March 29, 2025 13:07 · March 28, 2025 06:10
 #include <cuda_runtime.h>
 #include <iostream>
 #include <chrono>

 #define CHECK_CUDA(call) \
    if ((call) != cudaSuccess) { \
        std::cerr << "CUDA error at " << __FILE__ << ":" << __LINE__ << std::endl; \
        std::exit(1); \
    }
 #include <cuda_runtime.h>
 #include <iostream>
 #include <chrono>

 #define CHECK_CUDA(call)                                                       \
    do {                                                                       \
        cudaError_t err = call;                                                \
        if (err != cudaSuccess) {                                              \
            std::cerr << "CUDA Error: " << cudaGetErrorString(err) << "\n";   \
            exit(EXIT_FAILURE);                                                \
 #include <cuda_runtime.h>
 #include <iostream>
 #include <chrono>

 #define CHECK_CUDA(call)                                                       \
    do {                                                                       \
        cudaError_t err = call;                                                \
        if (err != cudaSuccess) {                                              \
            std::cerr << "CUDA Error: " << cudaGetErrorString(err) << "\n";   \
            exit(EXIT_FAILURE);                                                \
 12,13c12,15
 < #include "ggml-cpu/unary-ops.h"
 < #include "ggml-cpu/binary-ops.h"
 ---
 > #include "unary-ops.h"
 > #include "binary-ops.h"
 > #include "vec.h"
 > #include "ops.h"
 86,109d87
 < #if defined(GGML_USE_ACCELERATE)
 diff --git a/ops.cpp b/ops.cpp
 index 6190d0d..c44157b 100644
 --- a/ops.cpp
 +++ b/ops.cpp
 @@ -2347,7 +2347,7 @@ static void ggml_compute_forward_repeat_back_f32(
     GGML_ASSERT(nb00 == sizeof(float));
 
     if (ggml_is_contiguous(dst)) {
 -        ggml_vec_set_f32(ne0*ne1*ne2*ne3, dst->data, 0);
 +        ggml_vec_set_f32(ne0*ne1*ne2*ne3, (float *)dst->data, 0);
 11a12,13
 > #include "ggml-cpu/unary-ops.h"
 > #include "ggml-cpu/binary-ops.h"
 4292,4625d4293
 < static void ggml_compute_forward_add_f32(
 <         const struct ggml_compute_params * params,
 <         struct ggml_tensor * dst) {
 < 
 <     const struct ggml_tensor * src0 = dst->src[0];
 <     const struct ggml_tensor * src1 = dst->src[1];
 #include "ggml.h"
 #include "ggml-cpu.h"

 #ifdef GGML_USE_CUDA
 #include "ggml-cuda.h"
 #endif

 #include <vector>
 #include <iostream>
 #include <chrono>
 #include "ggml.h"
 #include "ggml-cpu.h"

 #ifdef GGML_USE_CUDA
 #include "ggml-cuda.h"
 #endif

 #include <vector>
 #include <iostream>
 #include <chrono>
 #include "ggml.h"
 #include "ggml-cpu.h"

 #ifdef GGML_USE_CUDA
 #include "ggml-cuda.h"
 #endif

 #include <vector>
 #include <iostream>
 import pefile
 import sys

 if len(sys.argv) < 2:
    print("Error: No file path specified. Usage: python hexdump.py <file_path>")
    sys.exit(1)

 file_path = sys.argv[1]

 try:
	#include <cuda_runtime.h>
	#include <iostream>
	#include <chrono>

	#define CHECK_CUDA(call) \
	if ((call) != cudaSuccess) { \
	std::cerr << "CUDA error at " << __FILE__ << ":" << __LINE__ << std::endl; \
	std::exit(1); \
	}
	12,13c12,15
	< #include "ggml-cpu/unary-ops.h"
	< #include "ggml-cpu/binary-ops.h"
	---
	> #include "unary-ops.h"
	> #include "binary-ops.h"
	> #include "vec.h"
	> #include "ops.h"
	86,109d87
	< #if defined(GGML_USE_ACCELERATE)
	diff --git a/ops.cpp b/ops.cpp
	index 6190d0d..c44157b 100644
	--- a/ops.cpp
	+++ b/ops.cpp
	@@ -2347,7 +2347,7 @@ static void ggml_compute_forward_repeat_back_f32(
	GGML_ASSERT(nb00 == sizeof(float));

	if (ggml_is_contiguous(dst)) {
	- ggml_vec_set_f32(ne0ne1ne2*ne3, dst->data, 0);
	+ ggml_vec_set_f32(ne0ne1ne2ne3, (float )dst->data, 0);
	11a12,13
	> #include "ggml-cpu/unary-ops.h"
	> #include "ggml-cpu/binary-ops.h"
	4292,4625d4293
	< static void ggml_compute_forward_add_f32(
	< const struct ggml_compute_params * params,
	< struct ggml_tensor * dst) {
	<
	< const struct ggml_tensor * src0 = dst->src[0];
	< const struct ggml_tensor * src1 = dst->src[1];
	#include "ggml.h"
	#include "ggml-cpu.h"

	#ifdef GGML_USE_CUDA
	#include "ggml-cuda.h"
	#endif

	#include <vector>
	#include <iostream>
	#include <chrono>
	import pefile
	import sys

	if len(sys.argv) < 2:
	print("Error: No file path specified. Usage: python hexdump.py <file_path>")
	sys.exit(1)

	file_path = sys.argv[1]

	try: