1/*
2 * Licensed to the Apache Software Foundation (ASF) under one
3 * or more contributor license agreements. See the NOTICE file
4 * distributed with this work for additional information
5 * regarding copyright ownership. The ASF licenses this file
6 * to you under the Apache License, Version 2.0 (the
7 * "License"); you may not use this file except in compliance
8 * with the License. You may obtain a copy of the License at
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing,
13 * software distributed under the License is distributed on an
14 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15 * KIND, either express or implied. See the License for the
16 * specific language governing permissions and limitations
17 * under the License.
18 */
19
20/*!
21 * \file x86/injective.h
22 * \brief x86 schedule for injective ops
23 */
24#ifndef TVM_TOPI_X86_INJECTIVE_H_
25#define TVM_TOPI_X86_INJECTIVE_H_
26
27#include <tvm/target/generic_func.h>
28#include <tvm/te/operation.h>
29#include <tvm/topi/detail/fuse.h>
30#include <tvm/topi/tags.h>
31
32namespace tvm {
33namespace topi {
34
35using namespace tvm::te;
36
37namespace x86 {
38
39/*!
40 * \brief Updates an existing schedule for the given injective ops.
41 *
42 * \param sch The schedule to update.
43 * \param out The tensor representing the injective op.
44 *
45 * \return The updated schedule.
46 */
47inline Schedule schedule_injective_from_existing(Schedule sch, const Tensor& out) {
48 auto axis = sch[out]->op.as<ComputeOpNode>()->axis;
49 if (axis.size() == 4) {
50 auto n = axis[0];
51 auto c = axis[1];
52 auto fused = detail::Fuse(sch[out], {n, c}); // for nhwc layout, fuse n and h
53 sch[out].parallel(fused);
54 } else {
55 sch[out].parallel(axis[0]);
56 }
57 return sch;
58}
59
60/*!
61 * \brief Create an x86 schedule for the given injective ops.
62 *
63 * \param target The target to generate a schedule for.
64 * \param outs The output tensors.
65 *
66 * \return A schedule for the given ops.
67 */
68inline Schedule schedule_injective(const Target& target, const Array<Tensor>& outs) {
69 Array<Operation> out_ops;
70 for (auto t : outs) {
71 out_ops.push_back(t->op);
72 }
73 auto s = create_schedule(out_ops);
74 tvm::te::AutoInlineInjective(s);
75
76 auto x = outs[0];
77 schedule_injective_from_existing(s, x);
78
79 return s;
80}
81
82} // namespace x86
83} // namespace topi
84} // namespace tvm
85#endif // TVM_TOPI_X86_INJECTIVE_H_
86