/* ****************************************************************************** * * * This program and the accompanying materials are made available under the * terms of the Apache License, Version 2.0 which is available at * https://www.apache.org/licenses/LICENSE-2.0. * * See the NOTICE file distributed with this work for additional * information regarding copyright ownership. * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the * License for the specific language governing permissions and limitations * under the License. * * SPDX-License-Identifier: Apache-2.0 ******************************************************************************/ // // @author raver119@gmail.com // #include #include #include namespace sd { namespace ops { namespace helpers { static Nd4jLong hamming_distance(unsigned long long x, unsigned long long y) { Nd4jLong dist = 0; for (unsigned long long val = x ^ y; val > 0; val /= 2) { if (val & 1) dist++; } return dist; } template static void _hamming(NDArray &x, NDArray &y, NDArray &z) { auto xEws = x.ews(); auto yEws = y.ews(); auto xBuffer = x.bufferAsT(); auto yBuffer = y.bufferAsT(); Nd4jLong distance = 0; auto lengthOf = x.lengthOf(); int maxThreads = sd::math::nd4j_min(256, omp_get_max_threads()); Nd4jLong intermediate[256]; // nullify temp values for (int e = 0; e < maxThreads; e++) intermediate[e] = 0; if (xEws == 1 && yEws == 1 && x.ordering() == y.ordering()) { auto func = PRAGMA_THREADS_FOR { for (auto e = start; e < stop; e++) { auto _x = static_cast(xBuffer[e]); auto _y = static_cast(yBuffer[e]); intermediate[thread_id] += hamming_distance(_x, _y); } }; maxThreads = samediff::Threads::parallel_for(func, 0, lengthOf); } else if (xEws > 1 && yEws > 1 && x.ordering() == y.ordering()) { auto func = PRAGMA_THREADS_FOR { for (auto e = start; e < stop; e++) { auto _x = static_cast(xBuffer[e * xEws]); auto _y = static_cast(yBuffer[e * yEws]); intermediate[thread_id] += hamming_distance(_x, _y); } }; maxThreads = samediff::Threads::parallel_for(func, 0, lengthOf); } else { auto func = PRAGMA_THREADS_FOR { for (auto e = start; e < stop; e++) { auto _x = static_cast(x.e(e)); auto _y = static_cast(y.e(e)); intermediate[thread_id] += hamming_distance(_x, _y); } }; maxThreads = samediff::Threads::parallel_for(func, 0, lengthOf); } // accumulate intermediate variables into output array for (int e = 0; e < maxThreads; e++) distance += intermediate[e]; z.p(0, distance); } void hamming(LaunchContext *context, NDArray &x, NDArray &y, NDArray &output) { BUILD_DOUBLE_SELECTOR(x.dataType(), output.dataType(), _hamming, (x, y, output), INTEGER_TYPES, INDEXING_TYPES); } } } }