powerpc: Introduce infrastructure for feature sections with alternatives
authorMichael Ellerman <michael@ellerman.id.au>
Tue, 24 Jun 2008 01:32:54 +0000 (11:32 +1000)
committerPaul Mackerras <paulus@samba.org>
Tue, 1 Jul 2008 01:28:28 +0000 (11:28 +1000)
The current feature section logic only supports nop'ing out code, this means
if you want to choose at runtime between instruction sequences, one or both
cases will have to execute the nop'ed out contents of the other section, eg:

BEGIN_FTR_SECTION
or 1,1,1
END_FTR_SECTION_IFSET(FOO)
BEGIN_FTR_SECTION
or 2,2,2
END_FTR_SECTION_IFCLR(FOO)

and the resulting code will be either,

or 1,1,1
nop

or,
nop
or 2,2,2

For small code segments this is fine, but for larger code blocks and in
performance criticial code segments, it would be nice to avoid the nops.
This commit starts to implement logic to allow the following:

BEGIN_FTR_SECTION
or 1,1,1
FTR_SECTION_ELSE
or 2,2,2
ALT_FTR_SECTION_END_IFSET(FOO)

and the resulting code will be:

or 1,1,1
or,
or 2,2,2

We achieve this by extending the existing FTR macros. The current feature
section semantic just becomes a special case, ie. if the else case is empty
we nop out the default case.

The key limitation is that the size of the else case must be less than or
equal to the size of the default case. If the else case is smaller the
remainder of the section is nop'ed.

We let the linker put the else case code in with the rest of the text,
so that relative branches from the else case are more likley to link,
this has the disadvantage that we can't free the unused else cases.

This commit introduces the required macro and linker script changes, but
does not enable the patching of the alternative sections.

We also need to update two hand-made section entries in reg.h and timex.h

Signed-off-by: Michael Ellerman <michael@ellerman.id.au>
Signed-off-by: Paul Mackerras <paulus@samba.org>
arch/powerpc/kernel/vdso32/vdso32.lds.S
arch/powerpc/kernel/vdso64/vdso64.lds.S
arch/powerpc/kernel/vmlinux.lds.S
arch/powerpc/lib/feature-fixups.c
include/asm-powerpc/feature-fixups.h
include/asm-powerpc/reg.h
include/asm-powerpc/timex.h

index 9352ab5200e591ba2a0b2cb551f125a2b29dc652..271793577cdc3c08d887940c2ee49033a488a7d2 100644 (file)
@@ -24,7 +24,7 @@ SECTIONS
 
        . = ALIGN(16);
        .text           : {
-               *(.text .stub .text.* .gnu.linkonce.t.*)
+               *(.text .stub .text.* .gnu.linkonce.t.* __ftr_alt_*)
        }
        PROVIDE(__etext = .);
        PROVIDE(_etext = .);
index 7d6585f902776dce82bebe7c018d46409101259c..e608d1bd3bff95ed6cb4e5cade70a84a4f241c7c 100644 (file)
@@ -24,7 +24,7 @@ SECTIONS
 
        . = ALIGN(16);
        .text           : {
-               *(.text .stub .text.* .gnu.linkonce.t.*)
+               *(.text .stub .text.* .gnu.linkonce.t.* __ftr_alt_*)
                *(.sfpr .glink)
        }                                               :text
        PROVIDE(__etext = .);
index 0c3000bf8d75d8919e20df3e44ba9a99d7bb7d14..3c07811989fc5317982a74b28e78749cb133a2dc 100644 (file)
@@ -35,7 +35,7 @@ SECTIONS
                ALIGN_FUNCTION();
                *(.text.head)
                _text = .;
-               *(.text .fixup .text.init.refok .exit.text.refok)
+               *(.text .fixup .text.init.refok .exit.text.refok __ftr_alt_*)
                SCHED_TEXT
                LOCK_TEXT
                KPROBES_TEXT
index f6fd5d2ff10deb14d2e9741c30c2eda40f338af8..973d547ef01d5b1986f8bd6b14de97c8f9e17a6d 100644 (file)
@@ -22,6 +22,8 @@ struct fixup_entry {
        unsigned long   value;
        long            start_off;
        long            end_off;
+       long            alt_start_off;
+       long            alt_end_off;
 };
 
 static void patch_feature_section(unsigned long value, struct fixup_entry *fcur)
index 35f927888fe8a074b05accbb9120f2ba42fb071c..ab30129dced7404e84cb0d0158b2a5fc247dd9b0 100644 (file)
 #define FTR_ENTRY_OFFSET       PPC_LONG
 #endif
 
+#define START_FTR_SECTION(label)       label##1:
+
+#define FTR_SECTION_ELSE_NESTED(label)                 \
+label##2:                                              \
+       .pushsection __ftr_alt_##label,"a";             \
+       .align 2;                                       \
+label##3:
+
 #define MAKE_FTR_SECTION_ENTRY(msk, val, label, sect)  \
-99:                                                    \
-       .section sect,"a";                              \
+label##4:                                              \
+       .popsection;                                    \
+       .pushsection sect,"a";                          \
        .align 3;                                       \
-98:                                                    \
+label##5:                                              \
        FTR_ENTRY_LONG msk;                             \
        FTR_ENTRY_LONG val;                             \
-       FTR_ENTRY_OFFSET label##b-98b;                  \
-       FTR_ENTRY_OFFSET 99b-98b;                       \
-       .previous
-
+       FTR_ENTRY_OFFSET label##1b-label##5b;           \
+       FTR_ENTRY_OFFSET label##2b-label##5b;           \
+       FTR_ENTRY_OFFSET label##3b-label##5b;           \
+       FTR_ENTRY_OFFSET label##4b-label##5b;           \
+       .popsection;
 
 
 /* CPU feature dependent sections */
-#define BEGIN_FTR_SECTION_NESTED(label)        label:
-#define BEGIN_FTR_SECTION              BEGIN_FTR_SECTION_NESTED(97)
+#define BEGIN_FTR_SECTION_NESTED(label)        START_FTR_SECTION(label)
+#define BEGIN_FTR_SECTION              START_FTR_SECTION(97)
 
-#define END_FTR_SECTION_NESTED(msk, val, label) \
+#define END_FTR_SECTION_NESTED(msk, val, label)                \
+       FTR_SECTION_ELSE_NESTED(label)                          \
        MAKE_FTR_SECTION_ENTRY(msk, val, label, __ftr_fixup)
 
 #define END_FTR_SECTION(msk, val)              \
 #define END_FTR_SECTION_IFSET(msk)     END_FTR_SECTION((msk), (msk))
 #define END_FTR_SECTION_IFCLR(msk)     END_FTR_SECTION((msk), 0)
 
+/* CPU feature sections with alternatives, use BEGIN_FTR_SECTION to start */
+#define FTR_SECTION_ELSE       FTR_SECTION_ELSE_NESTED(97)
+#define ALT_FTR_SECTION_END_NESTED(msk, val, label)    \
+       MAKE_FTR_SECTION_ENTRY(msk, val, label, __ftr_fixup)
+#define ALT_FTR_SECTION_END_NESTED_IFSET(msk, label)   \
+       ALT_FTR_SECTION_END_NESTED(msk, msk, label)
+#define ALT_FTR_SECTION_END_NESTED_IFCLR(msk, label)   \
+       ALT_FTR_SECTION_END_NESTED(msk, 0, label)
+#define ALT_FTR_SECTION_END(msk, val)  \
+       ALT_FTR_SECTION_END_NESTED(msk, val, 97)
+#define ALT_FTR_SECTION_END_IFSET(msk) \
+       ALT_FTR_SECTION_END_NESTED_IFSET(msk, 97)
+#define ALT_FTR_SECTION_END_IFCLR(msk) \
+       ALT_FTR_SECTION_END_NESTED_IFCLR(msk, 97)
 
 /* Firmware feature dependent sections */
-#define BEGIN_FW_FTR_SECTION_NESTED(label)     label:
-#define BEGIN_FW_FTR_SECTION                   BEGIN_FW_FTR_SECTION_NESTED(97)
+#define BEGIN_FW_FTR_SECTION_NESTED(label)     START_FTR_SECTION(label)
+#define BEGIN_FW_FTR_SECTION                   START_FTR_SECTION(97)
 
-#define END_FW_FTR_SECTION_NESTED(msk, val, label) \
+#define END_FW_FTR_SECTION_NESTED(msk, val, label)             \
+       FTR_SECTION_ELSE_NESTED(label)                          \
        MAKE_FTR_SECTION_ENTRY(msk, val, label, __fw_ftr_fixup)
 
 #define END_FW_FTR_SECTION(msk, val)           \
 #define END_FW_FTR_SECTION_IFSET(msk)  END_FW_FTR_SECTION((msk), (msk))
 #define END_FW_FTR_SECTION_IFCLR(msk)  END_FW_FTR_SECTION((msk), 0)
 
+/* Firmware feature sections with alternatives */
+#define FW_FTR_SECTION_ELSE_NESTED(label)      FTR_SECTION_ELSE_NESTED(label)
+#define FW_FTR_SECTION_ELSE    FTR_SECTION_ELSE_NESTED(97)
+#define ALT_FW_FTR_SECTION_END_NESTED(msk, val, label) \
+       MAKE_FTR_SECTION_ENTRY(msk, val, label, __fw_ftr_fixup)
+#define ALT_FW_FTR_SECTION_END_NESTED_IFSET(msk, label)        \
+       ALT_FW_FTR_SECTION_END_NESTED(msk, msk, label)
+#define ALT_FW_FTR_SECTION_END_NESTED_IFCLR(msk, label)        \
+       ALT_FW_FTR_SECTION_END_NESTED(msk, 0, label)
+#define ALT_FW_FTR_SECTION_END(msk, val)       \
+       ALT_FW_FTR_SECTION_END_NESTED(msk, val, 97)
+#define ALT_FW_FTR_SECTION_END_IFSET(msk)      \
+       ALT_FW_FTR_SECTION_END_NESTED_IFSET(msk, 97)
+#define ALT_FW_FTR_SECTION_END_IFCLR(msk)      \
+       ALT_FW_FTR_SECTION_END_NESTED_IFCLR(msk, 97)
+
 #endif /* __ASSEMBLY__ */
 
 #endif /* __ASM_POWERPC_FEATURE_FIXUPS_H */
index 079999b032af02483e00a950cb9be9f18bb4843d..7256efb5c140c4f22285745c873318a4e953b12b 100644 (file)
                                "       .llong %1\n"                    \
                                "       .llong 97b-98b\n"               \
                                "       .llong 99b-98b\n"               \
+                               "       .llong 0\n"                     \
+                               "       .llong 0\n"                     \
                                ".previous"                             \
                        : "=r" (rval) : "i" (CPU_FTR_CELL_TB_BUG)); rval;})
 #else
index 92dedde761d183a0109dfd7173c37ec1f3a1d43b..c55e14f7ef445486ccb2ba9c938934706ce2be0d 100644 (file)
@@ -38,6 +38,8 @@ static inline cycles_t get_cycles(void)
                "       .long 0\n"
                "       .long 97b-98b\n"
                "       .long 99b-98b\n"
+               "       .long 0\n"
+               "       .long 0\n"
                ".previous"
                : "=r" (ret) : "i" (CPU_FTR_601));
        return ret;