Skip to content

Commit 2ce0ce8

Browse files
authored
Merge pull request #586 from ThePortlandGroup/nv_stage
Pull 2018-09-12T15-41 Recent NVIDIA Changes
2 parents 0a33213 + 0679b2f commit 2ce0ce8

File tree

22 files changed

+174
-178
lines changed

22 files changed

+174
-178
lines changed

runtime/libpgmath/lib/common/arm64intrin.h

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2608,7 +2608,7 @@ _mm_min_sd(const __m128d& a, const __m128d& b)
26082608
{
26092609
double aa = vec_extract(a, 0);
26102610
double bb = vec_extract(b, 0);
2611-
aa < bb ? aa : bb;
2611+
aa = aa < bb ? aa : bb;
26122612
return vec_insert(aa, a, 0);
26132613
}
26142614

@@ -2618,7 +2618,7 @@ _mm_max_sd(const __m128d& a, const __m128d& b)
26182618
{
26192619
double aa = vec_extract(a, 0);
26202620
double bb = vec_extract(b, 0);
2621-
aa > bb ? aa : bb;
2621+
aa = aa > bb ? aa : bb;
26222622
return vec_insert(aa, a, 0);
26232623
}
26242624

runtime/libpgmath/lib/common/log/fma3/fdlog1.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -36,7 +36,7 @@ __m128d __internal_fast_int2dbl(__m128i a)
3636
__m128d const INT2DBL = (__m128d)_mm_set1_epi64x(INT2DBL_D);
3737

3838
__m128i t = _mm_xor_si128(INT2DBL_LO, a);
39-
t = _mm_blend_epi32(INT2DBL_HI, t, H55_D);
39+
t = _mm_blend_epi32(INT2DBL_HI, t, 0x5);
4040
return _mm_sub_sd((__m128d)t, INT2DBL);
4141
}
4242

runtime/libpgmath/lib/common/log/fma3/fdlog2.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -36,7 +36,7 @@ __m128d __internal_fast_int2dbl(__m128i a)
3636
__m128d const INT2DBL = (__m128d)_mm_set1_epi64x(INT2DBL_D);
3737

3838
__m128i t = _mm_xor_si128(INT2DBL_LO, a);
39-
t = _mm_blend_epi32(INT2DBL_HI, t, H55_D);
39+
t = _mm_blend_epi32(INT2DBL_HI, t, 0x5);
4040
return _mm_sub_pd((__m128d)t, INT2DBL);
4141
}
4242

runtime/libpgmath/lib/common/log/fma3/fdlog4.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ __m256d __internal_fast_int2dbl(__m256i a)
3535
__m256d const INT2DBL = (__m256d)_mm256_set1_epi64x(INT2DBL_D);
3636

3737
__m256i t = _mm256_xor_si256(INT2DBL_LO, a);
38-
t = _mm256_blend_epi32(INT2DBL_HI, t, H55_D);
38+
t = _mm256_blend_epi32(INT2DBL_HI, t, 0x55);
3939
return _mm256_sub_pd((__m256d)t, INT2DBL);
4040
}
4141

runtime/libpgmath/lib/common/log/fma3/fdlog8.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ __m512d __internal_fast_int2dbl(__m512i a)
3737
__m512d const INT2DBL = (__m512d)_mm512_set1_epi64(INT2DBL_D);
3838

3939
__m512i t = _mm512_xor_si512(INT2DBL_LO, a);
40-
t = _mm512_mask_blend_epi32((H55_D<<8)|H55_D, INT2DBL_HI, t);
40+
t = _mm512_mask_blend_epi32(0x5555, INT2DBL_HI, t);
4141
return _mm512_sub_pd((__m512d)t, INT2DBL);
4242
}
4343

runtime/libpgmath/lib/common/log/fma3/fdlog_defs.h

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
2+
* Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.
@@ -20,8 +20,6 @@
2020
#define INT2DBL_LO_D 0x0000000080000000
2121
#define INT2DBL_D 0x4330000080000000
2222

23-
#define H55_D 0x55
24-
2523
#define ZERO_D 0.0
2624
#define ALL_ONES_EXPONENT_D 0x7FF0000000000000
2725
#define NAN_VAL_D 0xFFF8000000000000

tools/flang1/flang1exe/symacc.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -181,7 +181,7 @@ typedef struct {
181181
const char *ocnames[OC_MAX + 1];
182182
const char *scnames[SC_MAX + 1];
183183
const char *tynames[TY_MAX + 1];
184-
int i0, i1;
184+
SPTR i0, i1;
185185
int k0, k1;
186186
SPTR flt0, dbl0, quad0;
187187
SPTR fltm0, dblm0, quadm0; /* floating point minus 0 */

0 commit comments

Comments
 (0)