RET_P(p);
}
+// Byte alignment that newPinnedByteArrayzh_fast gives to the payload of the
+// arrays it allocates, and the matching low-bit mask used to round up to it.
+#define BA_ALIGN 16
+#define BA_MASK (BA_ALIGN-1)
+
+// Allocates an ARR_WORDS object through allocatePinned() with room for R1
+// bytes of payload, positions it so that the payload (the bytes following the
+// StgArrWords header) starts on a BA_ALIGN-byte boundary, and returns it.
newPinnedByteArrayzh_fast
{
W_ words, payload_words, n, p;
n = R1;
payload_words = ROUNDUP_BYTES_TO_WDS(n);
- // We want a 16-byte aligned array. allocatePinned() gives us
+ // Reserve the payload plus the header size rounded up to BA_ALIGN, so there
+ // is slack to slide the object forwards below.
+ // NOTE(review): payload_words is a word count, while SIZEOF_StgArrWords and
+ // BA_MASK look like byte quantities; the sum is passed to allocatePinned()
+ // as a word count, so this appears to over-allocate -- TODO confirm.
+ words = payload_words + ((SIZEOF_StgArrWords + BA_MASK) & ~BA_MASK);
+
+ ("ptr" p) = foreign "C" allocatePinned(words) [];
+ TICK_ALLOC_PRIM(SIZEOF_StgArrWords,WDS(payload_words),0);
+
+ // This bumps p forwards so that the payload falls on a BA_ALIGN-byte boundary.
+ p = p + ((-p - SIZEOF_StgArrWords) & BA_MASK);
+
+ SET_HDR(p, stg_ARR_WORDS_info, W_[CCCS]);
+ StgArrWords_words(p) = payload_words;
+ RET_P(p);
+}
+
+newAlignedPinnedByteArrayzh_fast
+{
+ W_ words, payload_words, n, p, mask;
+
+ MAYBE_GC(NO_PTRS,newAlignedPinnedByteArrayzh_fast);
+ n = R1;
+
+ if (R2 > SIZEOF_W) {
+ mask = R2 - 1;
+ } else {
+ mask = 0;
+ }
+
+ payload_words = ROUNDUP_BYTES_TO_WDS(n);
+
+ // We want an <align>-byte aligned array. allocatePinned() gives us
// 8-byte aligned memory by default, but we want to align the
// *goods* inside the ArrWords object, so we have to check the
// size of the ArrWords header and adjust our size accordingly.
- words = payload_words + ((SIZEOF_StgArrWords + 15) & ~15);
+ words = payload_words + ((SIZEOF_StgArrWords + mask) & ~mask);
("ptr" p) = foreign "C" allocatePinned(words) [];
TICK_ALLOC_PRIM(SIZEOF_StgArrWords,WDS(payload_words),0);
- // Push the pointer forward so that the goods fall on a 16-byte boundary.
- p = p + ((p + SIZEOF_StgArrWords) & 15);
+ // This bumps p forwards so that the payload falls on an R2-byte boundary.
+ p = p + ((-p - SIZEOF_StgArrWords) & mask);
SET_HDR(p, stg_ARR_WORDS_info, W_[CCCS]);
StgArrWords_words(p) = payload_words;