File size: 3,049 Bytes
055eba4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
// Copyright 2024 Google LLC
// SPDX-License-Identifier: Apache-2.0
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     https://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "backprop/forward.h"

#include "backprop/prompt.h"
#include "gemma/activations.h"
#include "gemma/common.h"
#include "hwy/contrib/thread_pool/thread_pool.h"

// Compiles this file for multiple architectures via "foreach_target.h", to
// which we pass the filename via macro 'argument'.
#undef HWY_TARGET_INCLUDE
#define HWY_TARGET_INCLUDE "backprop/forward.cc"  // NOLINT
#include "hwy/foreach_target.h"        // IWYU pragma: keep

#include "hwy/highway.h"
// After highway.h
#include "backprop/forward-inl.h"
#include "gemma/weights.h"

HWY_BEFORE_NAMESPACE();
namespace gcpp {
namespace HWY_NAMESPACE {

template <typename TConfig>
float CrossEntropyLossForwardPass(const Prompt& prompt,
                                  const ByteStorageT& weights_u8,
                                  ByteStorageT& forward_u8,
                                  hwy::ThreadPool& pool) {
  const auto& weights =
      *reinterpret_cast<CompressedWeights<TConfig>*>(weights_u8.get());
  auto& forward =
      *reinterpret_cast<ForwardPass<float, TConfig>*>(forward_u8.get());
  return
      CrossEntropyLossForwardPass<TConfig, CompressedWeights, CompressedLayer>(
          prompt.tokens, prompt.context_size, weights, forward, pool);
}

// Per-target entry point: maps the runtime `model` value to the matching
// compile-time config and runs the typed forward pass for it.
// Aborts via HWY_ABORT for any model other than GEMMA_2B or GEMMA_TINY.
float CrossEntropyLossForwardPassT(Model model, const Prompt& prompt,
                                   const ByteStorageT& weights,
                                   ByteStorageT& forward,
                                   hwy::ThreadPool& pool) {
  // TODO(janwas): use CallFunctorForModel
  if (model == Model::GEMMA_2B) {
    using Config2B = ConfigGemma2B<float>;
    return CrossEntropyLossForwardPass<Config2B>(prompt, weights, forward,
                                                 pool);
  }
  if (model == Model::GEMMA_TINY) {
    using ConfigTiny = ConfigGemmaTiny<float>;
    return CrossEntropyLossForwardPass<ConfigTiny>(prompt, weights, forward,
                                                   pool);
  }
  // No supported configuration matched.
  HWY_ABORT("Model type %d unknown.", static_cast<int>(model));
}

}  // namespace HWY_NAMESPACE
}  // namespace gcpp
HWY_AFTER_NAMESPACE();

#if HWY_ONCE
namespace gcpp {

// Registers the per-target CrossEntropyLossForwardPassT implementations
// (one per HWY_NAMESPACE compiled above) so that HWY_DYNAMIC_DISPATCH can
// look them up by name. Must appear before the HWY_DYNAMIC_DISPATCH use below.
HWY_EXPORT(CrossEntropyLossForwardPassT);

// Public, target-independent entry point. Forwards all arguments unchanged to
// the CrossEntropyLossForwardPassT implementation selected by
// HWY_DYNAMIC_DISPATCH and returns its result.
float CrossEntropyLossForwardPass(const Model& model, const Prompt& prompt,
                                  const ByteStorageT& weights,
                                  ByteStorageT& forward,
                                  hwy::ThreadPool& pool) {
  const float loss = HWY_DYNAMIC_DISPATCH(CrossEntropyLossForwardPassT)(
      model, prompt, weights, forward, pool);
  return loss;
}

}  // namespace gcpp
#endif  // HWY_ONCE