Message ID | 20130208154809.GF3495@mudshark.cambridge.arm.com (mailing list archive) |
---|---|
State | New, archived |
Headers | show |
Am 08.02.2013 16:48, schrieb Will Deacon: > On Wed, Feb 06, 2013 at 11:01:23PM +0000, André Hentschel wrote: >> Am 06.02.2013 23:51, schrieb Russell King - ARM Linux: >>> On Wed, Feb 06, 2013 at 11:43:10PM +0100, André Hentschel wrote: >>>> There are more and more applications coming to WinRT, Wine could support them, >>>> but mostly they expect to have the thread environment block (TEB) in TPIDRURW. >>>> This register must be preserved per thread instead of being cleared. >>> >>> I'd prefer this was done a little more sensitively to those CPUs where >>> loads/stores are expensive, namely: >>> >>>> + >>>> + @ preserve TPIDRURW register state >>>> + get_tls2 r3, r4, r5 >>>> + str r3, [r1, #TI_TP2_VALUE] >>>> + ldr r3, [r2, #TI_TP2_VALUE] >>>> + set_tls2 r3, r4, r5 >>> >>> those two loads/stores get omitted from the thread switching if the CPU >>> doesn't support it. Do you think that's something you could do? >> >> No, i'm not sure how to improve this. How does the process can continue, can you or someone else fix that and add his Signed-off-by? > > How about something like the (completely untested) diff below? > > Andre: if this works for you, I'm happy to write a commit message etc. > > Cheers, > > Will > > --->8 I'll try the next days and report back, thx.
Am 08.02.2013 16:48, schrieb Will Deacon: > On Wed, Feb 06, 2013 at 11:01:23PM +0000, André Hentschel wrote: >> Am 06.02.2013 23:51, schrieb Russell King - ARM Linux: >>> On Wed, Feb 06, 2013 at 11:43:10PM +0100, André Hentschel wrote: >>>> There are more and more applications coming to WinRT, Wine could support them, >>>> but mostly they expect to have the thread environment block (TEB) in TPIDRURW. >>>> This register must be preserved per thread instead of being cleared. >>> >>> I'd prefer this was done a little more sensitively to those CPUs where >>> loads/stores are expensive, namely: >>> >>>> + >>>> + @ preserve TPIDRURW register state >>>> + get_tls2 r3, r4, r5 >>>> + str r3, [r1, #TI_TP2_VALUE] >>>> + ldr r3, [r2, #TI_TP2_VALUE] >>>> + set_tls2 r3, r4, r5 >>> >>> those two loads/stores get omitted from the thread switching if the CPU >>> doesn't support it. Do you think that's something you could do? >> >> No, i'm not sure how to improve this. How does the process can continue, can you or someone else fix that and add his Signed-off-by? > > How about something like the (completely untested) diff below? > > Andre: if this works for you, I'm happy to write a commit message etc. > > Cheers, > > Will Thx for your effort, but it doesn't work, at least not with my 3.4.6 suse kernel. Be free to have another try, i'll be happy to test it. > --->8 > > diff --git a/arch/arm/include/asm/thread_info.h b/arch/arm/include/asm/thread_info.h > index cddda1f..d90be6d 100644 > --- a/arch/arm/include/asm/thread_info.h > +++ b/arch/arm/include/asm/thread_info.h > @@ -58,7 +58,7 @@ struct thread_info { > struct cpu_context_save cpu_context; /* cpu context */ > __u32 syscall; /* syscall number */ > __u8 used_cp[16]; /* thread used copro */ > - unsigned long tp_value; > + unsigned long tp_value[2]; /* TLS registers */ > #ifdef CONFIG_CRUNCH > struct crunch_state crunchstate; > #endif > diff --git a/arch/arm/include/asm/tls.h b/arch/arm/include/asm/tls.h > index 73409e6..e1b09d32 100644 > --- a/arch/arm/include/asm/tls.h > +++ b/arch/arm/include/asm/tls.h > @@ -6,9 +6,9 @@ > .endm > > .macro set_tls_v6k, tp, tmp1, tmp2 > - mcr p15, 0, \tp, c13, c0, 3 @ set TLS register > - mov \tmp1, #0 > - mcr p15, 0, \tmp1, c13, c0, 2 @ clear user r/w TLS register > + ldrd \tmp1, \tmp2, [\tp] > + mcr p15, 0, \tmp1, c13, c0, 3 @ set user r/o TLS register > + mcr p15, 0, \tmp2, c13, c0, 2 @ set user r/w TLS register > .endm > > .macro set_tls_v6, tp, tmp1, tmp2 > @@ -16,15 +16,17 @@ > ldr \tmp1, [\tmp1, #0] > mov \tmp2, #0xffff0fff > tst \tmp1, #HWCAP_TLS @ hardware TLS available? > - mcrne p15, 0, \tp, c13, c0, 3 @ yes, set TLS register > - movne \tmp1, #0 > - mcrne p15, 0, \tmp1, c13, c0, 2 @ clear user r/w TLS register > - streq \tp, [\tmp2, #-15] @ set TLS value at 0xffff0ff0 > + ldrdne \tmp1, \tmp2, [\tp] > + ldreq \tmp1, [\tp] > + mcrne p15, 0, \tmp1, c13, c0, 3 @ yes, set user r/o TLS register > + mcrne p15, 0, \tmp2, c13, c0, 2 @ set user r/w TLS register > + streq \tmp1, [\tmp2, #-15] @ set TLS value at 0xffff0ff0 > .endm > > .macro set_tls_software, tp, tmp1, tmp2 > - mov \tmp1, #0xffff0fff > - str \tp, [\tmp1, #-15] @ set TLS value at 0xffff0ff0 > + ldr \tmp1, [\tp] > + mov \tmp2, #0xffff0fff > + str \tmp1, [\tmp2, #-15] @ set TLS value at 0xffff0ff0 > .endm > #endif > > diff --git a/arch/arm/kernel/entry-armv.S b/arch/arm/kernel/entry-armv.S > index 0f82098..a0a8fe3 100644 > --- a/arch/arm/kernel/entry-armv.S > +++ b/arch/arm/kernel/entry-armv.S > @@ -728,7 +728,7 @@ ENTRY(__switch_to) > UNWIND(.fnstart ) > UNWIND(.cantunwind ) > add ip, r1, #TI_CPU_SAVE > - ldr r3, [r2, #TI_TP_VALUE] > + add r3, r2, #TI_TP_VALUE > ARM( stmia ip!, {r4 - sl, fp, sp, lr} ) @ Store most regs on stack > THUMB( stmia ip!, {r4 - sl, fp} ) @ Store most regs on stack > THUMB( str sp, [ip], #4 ) > diff --git a/arch/arm/kernel/process.c b/arch/arm/kernel/process.c > index c6dec5f..ea298d2 100644 > --- a/arch/arm/kernel/process.c > +++ b/arch/arm/kernel/process.c > @@ -400,7 +400,7 @@ copy_thread(unsigned long clone_flags, unsigned long stack_start, > clear_ptrace_hw_breakpoint(p); > > if (clone_flags & CLONE_SETTLS) > - thread->tp_value = childregs->ARM_r3; > + thread->tp_value[0] = childregs->ARM_r3; > > thread_notify(THREAD_NOTIFY_COPY, thread); > > diff --git a/arch/arm/kernel/ptrace.c b/arch/arm/kernel/ptrace.c > index 03deeff..2bc1514 100644 > --- a/arch/arm/kernel/ptrace.c > +++ b/arch/arm/kernel/ptrace.c > @@ -849,7 +849,7 @@ long arch_ptrace(struct task_struct *child, long request, > #endif > > case PTRACE_GET_THREAD_AREA: > - ret = put_user(task_thread_info(child)->tp_value, > + ret = put_user(task_thread_info(child)->tp_value[0], > datap); > break; > > diff --git a/arch/arm/kernel/traps.c b/arch/arm/kernel/traps.c > index b0179b8..08b0db9 100644 > --- a/arch/arm/kernel/traps.c > +++ b/arch/arm/kernel/traps.c > @@ -588,7 +588,7 @@ asmlinkage int arm_syscall(int no, struct pt_regs *regs) > return regs->ARM_r0; > > case NR(set_tls): > - thread->tp_value = regs->ARM_r0; > + thread->tp_value[0] = regs->ARM_r0; > if (tls_emu) > return 0; > if (has_tls_reg) { > @@ -706,7 +706,7 @@ static int get_tp_trap(struct pt_regs *regs, unsigned int instr) > int reg = (instr >> 12) & 15; > if (reg == 15) > return 1; > - regs->uregs[reg] = current_thread_info()->tp_value; > + regs->uregs[reg] = current_thread_info()->tp_value[0]; > regs->ARM_pc += 4; > return 0; > } >
Hi Andre, On Tue, Feb 12, 2013 at 02:02:59PM +0000, André Hentschel wrote: > Am 08.02.2013 16:48, schrieb Will Deacon: > > On Wed, Feb 06, 2013 at 11:01:23PM +0000, André Hentschel wrote: > >> No, i'm not sure how to improve this. How does the process can continue, can you or someone else fix that and add his Signed-off-by? > > > > How about something like the (completely untested) diff below? > > > > Andre: if this works for you, I'm happy to write a commit message etc. > > Thx for your effort, but it doesn't work, at least not with my 3.4.6 suse kernel. > Be free to have another try, i'll be happy to test it. Well, cheers for testing. Can you be more specific about what goes wrong please? What do you see in TPIDRURW? Will
Am 12.02.2013 15:09, schrieb Will Deacon: > Hi Andre, > > On Tue, Feb 12, 2013 at 02:02:59PM +0000, André Hentschel wrote: >> Am 08.02.2013 16:48, schrieb Will Deacon: >>> On Wed, Feb 06, 2013 at 11:01:23PM +0000, André Hentschel wrote: >>>> No, i'm not sure how to improve this. How does the process can continue, can you or someone else fix that and add his Signed-off-by? >>> >>> How about something like the (completely untested) diff below? >>> >>> Andre: if this works for you, I'm happy to write a commit message etc. >> >> Thx for your effort, but it doesn't work, at least not with my 3.4.6 suse kernel. >> Be free to have another try, i'll be happy to test it. > > Well, cheers for testing. Can you be more specific about what goes wrong > please? What do you see in TPIDRURW? > > Will > -- > To unsubscribe from this list: send the line "unsubscribe linux-arch" in > the body of a message to majordomo@vger.kernel.org > More majordomo info at http://vger.kernel.org/majordomo-info.html > Hi Will, it's 0x00000000 again.
Will Deacon a écrit : > Hi Andre, > > On Tue, Feb 12, 2013 at 02:02:59PM +0000, André Hentschel wrote: >> Am 08.02.2013 16:48, schrieb Will Deacon: >>> On Wed, Feb 06, 2013 at 11:01:23PM +0000, André Hentschel wrote: >>>> No, i'm not sure how to improve this. How does the process can continue, can you or someone else fix that and add his Signed-off-by? >>> How about something like the (completely untested) diff below? >>> >>> Andre: if this works for you, I'm happy to write a commit message etc. >> Thx for your effort, but it doesn't work, at least not with my 3.4.6 suse kernel. >> Be free to have another try, i'll be happy to test it. > > Well, cheers for testing. Can you be more specific about what goes wrong > please? What do you see in TPIDRURW? > The tls value is never saved to : thread->tp_value[1]. Also I don't know if you can avoid the extra ldr in the software case. Matthieu
Am 12.02.2013 16:02, schrieb Matthieu CASTET: > Will Deacon a écrit : >> Hi Andre, >> >> On Tue, Feb 12, 2013 at 02:02:59PM +0000, André Hentschel wrote: >>> Am 08.02.2013 16:48, schrieb Will Deacon: >>>> On Wed, Feb 06, 2013 at 11:01:23PM +0000, André Hentschel wrote: >>>>> No, i'm not sure how to improve this. How does the process can continue, can you or someone else fix that and add his Signed-off-by? >>>> How about something like the (completely untested) diff below? >>>> >>>> Andre: if this works for you, I'm happy to write a commit message etc. >>> Thx for your effort, but it doesn't work, at least not with my 3.4.6 suse kernel. >>> Be free to have another try, i'll be happy to test it. >> >> Well, cheers for testing. Can you be more specific about what goes wrong >> please? What do you see in TPIDRURW? >> > The tls value is never saved to : thread->tp_value[1]. > > Also I don't know if you can avoid the extra ldr in the software case. > > Matthieu > -- > To unsubscribe from this list: send the line "unsubscribe linux-arch" in > the body of a message to majordomo@vger.kernel.org > More majordomo info at http://vger.kernel.org/majordomo-info.html > Hi Will, seems like Matthieu is right, any update on this?
Hi Andre, On Wed, Feb 20, 2013 at 07:34:37PM +0000, André Hentschel wrote: > Am 12.02.2013 16:02, schrieb Matthieu CASTET: > > The tls value is never saved to : thread->tp_value[1]. > > > > Also I don't know if you can avoid the extra ldr in the software case. > > seems like Matthieu is right, any update on this? Yeah, I'll get round to this after the merge window and send a v2. I have a nice long flight to Hong Kong on the horizon, which may well drive me to writing patches :) Cheers, Will
diff --git a/arch/arm/include/asm/thread_info.h b/arch/arm/include/asm/thread_info.h index cddda1f..d90be6d 100644 --- a/arch/arm/include/asm/thread_info.h +++ b/arch/arm/include/asm/thread_info.h @@ -58,7 +58,7 @@ struct thread_info { struct cpu_context_save cpu_context; /* cpu context */ __u32 syscall; /* syscall number */ __u8 used_cp[16]; /* thread used copro */ - unsigned long tp_value; + unsigned long tp_value[2]; /* TLS registers */ #ifdef CONFIG_CRUNCH struct crunch_state crunchstate; #endif diff --git a/arch/arm/include/asm/tls.h b/arch/arm/include/asm/tls.h index 73409e6..e1b09d32 100644 --- a/arch/arm/include/asm/tls.h +++ b/arch/arm/include/asm/tls.h @@ -6,9 +6,9 @@ .endm .macro set_tls_v6k, tp, tmp1, tmp2 - mcr p15, 0, \tp, c13, c0, 3 @ set TLS register - mov \tmp1, #0 - mcr p15, 0, \tmp1, c13, c0, 2 @ clear user r/w TLS register + ldrd \tmp1, \tmp2, [\tp] + mcr p15, 0, \tmp1, c13, c0, 3 @ set user r/o TLS register + mcr p15, 0, \tmp2, c13, c0, 2 @ set user r/w TLS register .endm .macro set_tls_v6, tp, tmp1, tmp2 @@ -16,15 +16,17 @@ ldr \tmp1, [\tmp1, #0] mov \tmp2, #0xffff0fff tst \tmp1, #HWCAP_TLS @ hardware TLS available? - mcrne p15, 0, \tp, c13, c0, 3 @ yes, set TLS register - movne \tmp1, #0 - mcrne p15, 0, \tmp1, c13, c0, 2 @ clear user r/w TLS register - streq \tp, [\tmp2, #-15] @ set TLS value at 0xffff0ff0 + ldrdne \tmp1, \tmp2, [\tp] + ldreq \tmp1, [\tp] + mcrne p15, 0, \tmp1, c13, c0, 3 @ yes, set user r/o TLS register + mcrne p15, 0, \tmp2, c13, c0, 2 @ set user r/w TLS register + streq \tmp1, [\tmp2, #-15] @ set TLS value at 0xffff0ff0 .endm .macro set_tls_software, tp, tmp1, tmp2 - mov \tmp1, #0xffff0fff - str \tp, [\tmp1, #-15] @ set TLS value at 0xffff0ff0 + ldr \tmp1, [\tp] + mov \tmp2, #0xffff0fff + str \tmp1, [\tmp2, #-15] @ set TLS value at 0xffff0ff0 .endm #endif diff --git a/arch/arm/kernel/entry-armv.S b/arch/arm/kernel/entry-armv.S index 0f82098..a0a8fe3 100644 --- a/arch/arm/kernel/entry-armv.S +++ b/arch/arm/kernel/entry-armv.S @@ -728,7 +728,7 @@ ENTRY(__switch_to) UNWIND(.fnstart ) UNWIND(.cantunwind ) add ip, r1, #TI_CPU_SAVE - ldr r3, [r2, #TI_TP_VALUE] + add r3, r2, #TI_TP_VALUE ARM( stmia ip!, {r4 - sl, fp, sp, lr} ) @ Store most regs on stack THUMB( stmia ip!, {r4 - sl, fp} ) @ Store most regs on stack THUMB( str sp, [ip], #4 ) diff --git a/arch/arm/kernel/process.c b/arch/arm/kernel/process.c index c6dec5f..ea298d2 100644 --- a/arch/arm/kernel/process.c +++ b/arch/arm/kernel/process.c @@ -400,7 +400,7 @@ copy_thread(unsigned long clone_flags, unsigned long stack_start, clear_ptrace_hw_breakpoint(p); if (clone_flags & CLONE_SETTLS) - thread->tp_value = childregs->ARM_r3; + thread->tp_value[0] = childregs->ARM_r3; thread_notify(THREAD_NOTIFY_COPY, thread); diff --git a/arch/arm/kernel/ptrace.c b/arch/arm/kernel/ptrace.c index 03deeff..2bc1514 100644 --- a/arch/arm/kernel/ptrace.c +++ b/arch/arm/kernel/ptrace.c @@ -849,7 +849,7 @@ long arch_ptrace(struct task_struct *child, long request, #endif case PTRACE_GET_THREAD_AREA: - ret = put_user(task_thread_info(child)->tp_value, + ret = put_user(task_thread_info(child)->tp_value[0], datap); break; diff --git a/arch/arm/kernel/traps.c b/arch/arm/kernel/traps.c index b0179b8..08b0db9 100644 --- a/arch/arm/kernel/traps.c +++ b/arch/arm/kernel/traps.c @@ -588,7 +588,7 @@ asmlinkage int arm_syscall(int no, struct pt_regs *regs) return regs->ARM_r0; case NR(set_tls): - thread->tp_value = regs->ARM_r0; + thread->tp_value[0] = regs->ARM_r0; if (tls_emu) return 0; if (has_tls_reg) { @@ -706,7 +706,7 @@ static int get_tp_trap(struct pt_regs *regs, unsigned int instr) int reg = (instr >> 12) & 15; if (reg == 15) return 1; - regs->uregs[reg] = current_thread_info()->tp_value; + regs->uregs[reg] = current_thread_info()->tp_value[0]; regs->ARM_pc += 4; return 0; }