File: attr_fastmath_x86.d

package info (click to toggle)
ldc 1%3A1.24.0-2
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 53,728 kB
  • sloc: cpp: 55,939; ansic: 10,599; sh: 958; makefile: 801; asm: 507; objc: 122; exp: 30; python: 12
file content (21 lines) | stat: -rw-r--r-- 487 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
// Test vectorized fused multiply-add in a simple dot product routine

// REQUIRES: target_X86

// RUN: %ldc -mtriple=x86_64-linux-gnu -mattr=+fma -O3 -release -c -output-s -of=%t.s %s && FileCheck %s --check-prefix ASM < %t.s

import ldc.attributes;

// ASM-LABEL: dot:
@fastmath
extern (C) double dot(double[] a, double[] b)
{
    double s = 0;
// ASM: vfmadd{{[123][123][123]}}pd
    foreach (size_t i; 0 .. a.length)
    {
        s += a[i] * b[i];
    }
    return s;
// ASM: ret
}