Received: by 2002:a05:6a10:17d3:0:0:0:0 with SMTP id hz19csp3358462pxb; Tue, 20 Apr 2021 06:40:40 -0700 (PDT) X-Google-Smtp-Source: ABdhPJyxHKKx+KMJkOOIc92oc2gF5PNG+jz+KsDstPInzQ/RHjoRKuZ/IeBRMCgvzvEsixkrFFQB X-Received: by 2002:a17:906:a0c2:: with SMTP id bh2mr26965196ejb.394.1618926039958; Tue, 20 Apr 2021 06:40:39 -0700 (PDT) ARC-Seal: i=1; a=rsa-sha256; t=1618926039; cv=none; d=google.com; s=arc-20160816; b=yedEKUwmfxNAkKnUKx+okrcFVo7SNtl31lGBej/GxN7NgUl7Xboid0IknqFc6Og38+ 9x0rR4auotIFuVLp3gArx985HUud+AnK/6VoHNgJZQgzrM1I4mR9jRsQSAJGFR3TZZ0M /Rrdq1qjGqXpJMk6cVRyJRM36E/HItpdzZtGug5RtFWPDgsjPHMwoWY9HsBJ6yKbuUJE pj8buhO8opJ6E5Bz4THUuAkF5P7i9dDIbtTRLNz0/EePD2WYanvsm0zzVFmvqwV8QQt7 Q+dLmlLpQ72zuFvFCi5TTXEy7O9rZYAG+O+LsLXnAAGNLGTLLJ64Afe5fsotRJ7ZuTUh EEcQ== ARC-Message-Signature: i=1; a=rsa-sha256; c=relaxed/relaxed; d=google.com; s=arc-20160816; h=list-id:precedence:content-transfer-encoding:content-language :in-reply-to:mime-version:user-agent:date:message-id:from:references :cc:to:subject; bh=nocWU6eKQizzfIO6eCjFP0d9WrEygWajrhAFPCfsaSA=; b=iYJrTbdxtk6vmaFIvMecP/CeYGnyWC3niqMPWsIfnyGdiwxvSum05kj5pNKwN6D6tb Img1epplxGKsxXLBSG1apFvuXf7GL9W0z3zJsAnCNGUtiWN+N+9CQ+K14JSALlz0hPbW 0N4olU+hrilA0sJu2PtDGpwLB+QFnOJ4VBt/k1AiwJtYANgzTuNCInan15hn+XtFCS0o mdSvBkbAhPIkWjJ9svYpw4JUoq1jO4QAS43fwLtTn5wsicVaxDOmPvmdH9zhNw4yefRK Ijwa43WsfHUxglu7pVRt6gOx6zox4nEF6K6FJyK5WNMnVnDFRVFQiYvA5+MVaFjaHIui rMhA== ARC-Authentication-Results: i=1; mx.google.com; spf=pass (google.com: domain of linux-kernel-owner@vger.kernel.org designates 23.128.96.18 as permitted sender) smtp.mailfrom=linux-kernel-owner@vger.kernel.org Return-Path: Received: from vger.kernel.org (vger.kernel.org. [23.128.96.18]) by mx.google.com with ESMTP id zo17si15385280ejb.1.2021.04.20.06.40.15; Tue, 20 Apr 2021 06:40:39 -0700 (PDT) Received-SPF: pass (google.com: domain of linux-kernel-owner@vger.kernel.org designates 23.128.96.18 as permitted sender) client-ip=23.128.96.18; Authentication-Results: mx.google.com; spf=pass (google.com: domain of linux-kernel-owner@vger.kernel.org designates 23.128.96.18 as permitted sender) smtp.mailfrom=linux-kernel-owner@vger.kernel.org Received: (majordomo@vger.kernel.org) by vger.kernel.org via listexpand id S232516AbhDTNhm (ORCPT + 99 others); Tue, 20 Apr 2021 09:37:42 -0400 Received: from pegase1.c-s.fr ([93.17.236.30]:48423 "EHLO pegase1.c-s.fr" rhost-flags-OK-OK-OK-OK) by vger.kernel.org with ESMTP id S232448AbhDTNhk (ORCPT ); Tue, 20 Apr 2021 09:37:40 -0400 Received: from localhost (mailhub1-int [192.168.12.234]) by localhost (Postfix) with ESMTP id 4FPl8y69TZz9txpD; Tue, 20 Apr 2021 15:37:06 +0200 (CEST) X-Virus-Scanned: Debian amavisd-new at c-s.fr Received: from pegase1.c-s.fr ([192.168.12.234]) by localhost (pegase1.c-s.fr [192.168.12.234]) (amavisd-new, port 10024) with ESMTP id e1dt6YejAfoj; Tue, 20 Apr 2021 15:37:06 +0200 (CEST) Received: from messagerie.si.c-s.fr (messagerie.si.c-s.fr [192.168.25.192]) by pegase1.c-s.fr (Postfix) with ESMTP id 4FPl8y5FKpz9tvgb; Tue, 20 Apr 2021 15:37:06 +0200 (CEST) Received: from localhost (localhost [127.0.0.1]) by messagerie.si.c-s.fr (Postfix) with ESMTP id 138B78B807; Tue, 20 Apr 2021 15:37:08 +0200 (CEST) X-Virus-Scanned: amavisd-new at c-s.fr Received: from messagerie.si.c-s.fr ([127.0.0.1]) by localhost (messagerie.si.c-s.fr [127.0.0.1]) (amavisd-new, port 10023) with ESMTP id xkfkUA4ekOeJ; Tue, 20 Apr 2021 15:37:07 +0200 (CEST) Received: from [192.168.4.90] (unknown [192.168.4.90]) by messagerie.si.c-s.fr (Postfix) with ESMTP id 765018B80A; Tue, 20 Apr 2021 15:37:07 +0200 (CEST) Subject: Re: [PATCH v1 2/2] powerpc: Enable OPTPROBES on PPC32 To: "Naveen N. Rao" , Benjamin Herrenschmidt , Michael Ellerman , Paul Mackerras Cc: linux-kernel@vger.kernel.org, linuxppc-dev@lists.ozlabs.org References: <28730d147adeaa6c2d0c98d0aa9e17e9e4bd043a.1617701875.git.christophe.leroy@csgroup.eu> <1618900760.son2fwciv1.naveen@linux.ibm.com> From: Christophe Leroy Message-ID: Date: Tue, 20 Apr 2021 15:37:06 +0200 User-Agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64; rv:78.0) Gecko/20100101 Thunderbird/78.9.1 MIME-Version: 1.0 In-Reply-To: <1618900760.son2fwciv1.naveen@linux.ibm.com> Content-Type: text/plain; charset=utf-8; format=flowed Content-Language: fr Content-Transfer-Encoding: 8bit Precedence: bulk List-ID: X-Mailing-List: linux-kernel@vger.kernel.org Le 20/04/2021 à 08:51, Naveen N. Rao a écrit : > Christophe Leroy wrote: >> For that, create a 32 bits version of patch_imm64_load_insns() >> and create a patch_imm_load_insns() which calls >> patch_imm32_load_insns() on PPC32 and patch_imm64_load_insns() >> on PPC64. >> >> Adapt optprobes_head.S for PPC32. Use PPC_LL/PPC_STL macros instead >> of raw ld/std, opt out things linked to paca and use stmw/lmw to >> save/restore registers. >> >> Signed-off-by: Christophe Leroy >> --- >>  arch/powerpc/Kconfig                 |  2 +- >>  arch/powerpc/kernel/optprobes.c      | 24 +++++++++++++-- >>  arch/powerpc/kernel/optprobes_head.S | 46 +++++++++++++++++++--------- >>  3 files changed, 53 insertions(+), 19 deletions(-) > > Thanks for adding support for ppc32. It is good to see that it works without too many changes. > >> >> diff --git a/arch/powerpc/Kconfig b/arch/powerpc/Kconfig >> index c1344c05226c..49b538e54efb 100644 >> --- a/arch/powerpc/Kconfig >> +++ b/arch/powerpc/Kconfig >> @@ -227,7 +227,7 @@ config PPC >>      select HAVE_MOD_ARCH_SPECIFIC >>      select HAVE_NMI                if PERF_EVENTS || (PPC64 && PPC_BOOK3S) >>      select HAVE_HARDLOCKUP_DETECTOR_ARCH    if PPC64 && PPC_BOOK3S && SMP >> -    select HAVE_OPTPROBES            if PPC64 >> +    select HAVE_OPTPROBES >>      select HAVE_PERF_EVENTS >>      select HAVE_PERF_EVENTS_NMI        if PPC64 >>      select HAVE_HARDLOCKUP_DETECTOR_PERF    if PERF_EVENTS && HAVE_PERF_EVENTS_NMI && >> !HAVE_HARDLOCKUP_DETECTOR_ARCH >> diff --git a/arch/powerpc/kernel/optprobes.c b/arch/powerpc/kernel/optprobes.c >> index 58fdb9f66e0f..cdf87086fa33 100644 >> --- a/arch/powerpc/kernel/optprobes.c >> +++ b/arch/powerpc/kernel/optprobes.c >> @@ -141,11 +141,21 @@ void arch_remove_optimized_kprobe(struct optimized_kprobe *op) >>      } >>  } >> >> +static void patch_imm32_load_insns(unsigned long val, int reg, kprobe_opcode_t *addr) >> +{ >> +    patch_instruction((struct ppc_inst *)addr, >> +              ppc_inst(PPC_RAW_LIS(reg, IMM_H(val)))); >> +    addr++; >> + >> +    patch_instruction((struct ppc_inst *)addr, >> +              ppc_inst(PPC_RAW_ORI(reg, reg, IMM_L(val)))); >> +} >> + >>  /* >>   * Generate instructions to load provided immediate 64-bit value >>   * to register 'reg' and patch these instructions at 'addr'. >>   */ >> -static void patch_imm64_load_insns(unsigned long val, int reg, kprobe_opcode_t *addr) >> +static void patch_imm64_load_insns(unsigned long long val, int reg, kprobe_opcode_t *addr) > > Do you really need this? Without it I get: from arch/powerpc/kernel/optprobes.c:8: arch/powerpc/kernel/optprobes.c: In function 'patch_imm64_load_insns': arch/powerpc/kernel/optprobes.c:163:14: error: right shift count >= width of type [-Werror=shift-count-overflow] 163 | ((val >> 48) & 0xffff))); | ^~ ./arch/powerpc/include/asm/inst.h:69:48: note: in definition of macro 'ppc_inst' 69 | #define ppc_inst(x) ((struct ppc_inst){ .val = x }) | ^ arch/powerpc/kernel/optprobes.c:169:31: error: right shift count >= width of type [-Werror=shift-count-overflow] 169 | ___PPC_RS(reg) | ((val >> 32) & 0xffff))); | ^~ ./arch/powerpc/include/asm/inst.h:69:48: note: in definition of macro 'ppc_inst' 69 | #define ppc_inst(x) ((struct ppc_inst){ .val = x }) | ^ > >>  { >>      /* lis reg,(op)@highest */ >>      patch_instruction((struct ppc_inst *)addr, >> @@ -177,6 +187,14 @@ static void patch_imm64_load_insns(unsigned long val, int reg, kprobe_opcode_t * >>                     ___PPC_RS(reg) | (val & 0xffff))); >>  } >> >> +static void patch_imm_load_insns(unsigned long val, int reg, kprobe_opcode_t *addr) >> +{ >> +    if (IS_ENABLED(CONFIG_PPC64)) >> +        patch_imm64_load_insns(val, reg, addr); >> +    else >> +        patch_imm32_load_insns(val, reg, addr); >> +} >> + >>  int arch_prepare_optimized_kprobe(struct optimized_kprobe *op, struct kprobe *p) >>  { >>      struct ppc_inst branch_op_callback, branch_emulate_step, temp; >> @@ -230,7 +248,7 @@ int arch_prepare_optimized_kprobe(struct optimized_kprobe *op, struct kprobe *p) >>       * Fixup the template with instructions to: >>       * 1. load the address of the actual probepoint >>       */ >> -    patch_imm64_load_insns((unsigned long)op, 3, buff + TMPL_OP_IDX); >> +    patch_imm_load_insns((unsigned long)op, 3, buff + TMPL_OP_IDX); >> >>      /* >>       * 2. branch to optimized_callback() and emulate_step() >> @@ -264,7 +282,7 @@ int arch_prepare_optimized_kprobe(struct optimized_kprobe *op, struct kprobe *p) >>       * 3. load instruction to be emulated into relevant register, and >>       */ >>      temp = ppc_inst_read((struct ppc_inst *)p->ainsn.insn); >> -    patch_imm64_load_insns(ppc_inst_as_ulong(temp), 4, buff + TMPL_INSN_IDX); >> +    patch_imm_load_insns(ppc_inst_as_ulong(temp), 4, buff + TMPL_INSN_IDX); >> >>      /* >>       * 4. branch back from trampoline >> diff --git a/arch/powerpc/kernel/optprobes_head.S b/arch/powerpc/kernel/optprobes_head.S >> index ff8ba4d3824d..49f31e554573 100644 >> --- a/arch/powerpc/kernel/optprobes_head.S >> +++ b/arch/powerpc/kernel/optprobes_head.S >> @@ -30,39 +30,47 @@ optinsn_slot: >>      .global optprobe_template_entry >>  optprobe_template_entry: >>      /* Create an in-memory pt_regs */ >> -    stdu    r1,-INT_FRAME_SIZE(r1) >> +    PPC_STLU    r1,-INT_FRAME_SIZE(r1) >>      SAVE_GPR(0,r1) >>      /* Save the previous SP into stack */ >>      addi    r0,r1,INT_FRAME_SIZE >> -    std    r0,GPR1(r1) >> +    PPC_STL    r0,GPR1(r1) >> +#ifdef CONFIG_PPC64 >>      SAVE_10GPRS(2,r1) >>      SAVE_10GPRS(12,r1) >>      SAVE_10GPRS(22,r1) >> +#else >> +    stmw    r2, GPR2(r1) >> +#endif >>      /* Save SPRS */ >>      mfmsr    r5 >> -    std    r5,_MSR(r1) >> +    PPC_STL    r5,_MSR(r1) >>      li    r5,0x700 >> -    std    r5,_TRAP(r1) >> +    PPC_STL    r5,_TRAP(r1) >>      li    r5,0 >> -    std    r5,ORIG_GPR3(r1) >> -    std    r5,RESULT(r1) >> +    PPC_STL    r5,ORIG_GPR3(r1) >> +    PPC_STL    r5,RESULT(r1) >>      mfctr    r5 >> -    std    r5,_CTR(r1) >> +    PPC_STL    r5,_CTR(r1) >>      mflr    r5 >> -    std    r5,_LINK(r1) >> +    PPC_STL    r5,_LINK(r1) >>      mfspr    r5,SPRN_XER >> -    std    r5,_XER(r1) >> +    PPC_STL    r5,_XER(r1) >>      mfcr    r5 >> -    std    r5,_CCR(r1) >> +    PPC_STL    r5,_CCR(r1) >> +#ifdef CONFIG_PPC64 >>      lbz     r5,PACAIRQSOFTMASK(r13) >>      std     r5,SOFTE(r1) >> +#endif >> >>      /* >>       * We may get here from a module, so load the kernel TOC in r2. >>       * The original TOC gets restored when pt_regs is restored >>       * further below. >>       */ >> +#ifdef CONFIG_PPC64 >>      ld    r2,PACATOC(r13) >> +#endif > > Are the ISA and ABI documents for ppc32 available publicly? ABI: https://wiki.raptorcs.com/w/images/0/03/Power-Arch-32-bit-ABI-supp-1.0-Unified.pdf ISA: https://www.nxp.com/files-static/product/doc/MPCFPE32B.pdf > I would have thought that the TOC issues > apply to ppc32 as well, but want to understand why this isn't a problem there. r2 is the pointer to 'current' on PPC32. No TOC. > >> >>      .global optprobe_template_op_address >>  optprobe_template_op_address: >> @@ -72,9 +80,11 @@ optprobe_template_op_address: >>       */ >>      nop >>      nop >> +#ifdef CONFIG_PPC64 >>      nop >>      nop >>      nop >> +#endif >>      /* 2. pt_regs pointer in r4 */ >>      addi    r4,r1,STACK_FRAME_OVERHEAD >> >> @@ -94,9 +104,11 @@ optprobe_template_insn: >>      /* 2, Pass instruction to be emulated in r4 */ >>      nop >>      nop >> +#ifdef CONFIG_PPC64 >>      nop >>      nop >>      nop >> +#endif > > It would be nice to put these behind a macro so as to avoid these #ifdef blocks here, as well as > with the register save/restore sequence. > Will see what I can do Christophe