arch/powerpc/platforms/cell/spufs/run.c

   1 #define DEBUG
   2
   3 #include <linux/wait.h>
   4 #include <linux/ptrace.h>
   5
   6 #include <asm/spu.h>
   7 #include <asm/spu_priv1.h>
   8 #include <asm/io.h>
   9 #include <asm/unistd.h>
  10
  11 #include "spufs.h"
  12
  13 /* interrupt-level stop callback function. */
  14 void spufs_stop_callback(struct spu *spu)
  15 {
  16         struct spu_context *ctx = spu->ctx;
  17
  18         /*
  19          * It should be impossible to preempt a context while an exception
  20          * is being processed, since the context switch code is specially
  21          * coded to deal with interrupts ... But, just in case, sanity check
  22          * the context pointer.  It is OK to return doing nothing since
  23          * the exception will be regenerated when the context is resumed.
  24          */
  25         if (ctx) {
  26                 /* Copy exception arguments into module specific structure */
  27                 ctx->csa.class_0_pending = spu->class_0_pending;
  28                 ctx->csa.dsisr = spu->dsisr;
  29                 ctx->csa.dar = spu->dar;
  30
  31                 /* ensure that the exception status has hit memory before a
  32                  * thread waiting on the context's stop queue is woken */
  33                 smp_wmb();
  34
  35                 wake_up_all(&ctx->stop_wq);
  36         }
  37
  38         /* Clear callback arguments from spu structure */
  39         spu->class_0_pending = 0;
  40         spu->dsisr = 0;
  41         spu->dar = 0;
  42 }
  43
  44 int spu_stopped(struct spu_context *ctx, u32 *stat)
  45 {
  46         u64 dsisr;
  47         u32 stopped;
  48
  49         *stat = ctx->ops->status_read(ctx);
  50
  51         if (test_bit(SPU_SCHED_NOTIFY_ACTIVE, &ctx->sched_flags))
  52                 return 1;
  53
  54         stopped = SPU_STATUS_INVALID_INSTR | SPU_STATUS_SINGLE_STEP |
  55                 SPU_STATUS_STOPPED_BY_HALT | SPU_STATUS_STOPPED_BY_STOP;
  56         if (!(*stat & SPU_STATUS_RUNNING) && (*stat & stopped))
  57                 return 1;
  58
  59         dsisr = ctx->csa.dsisr;
  60         if (dsisr & (MFC_DSISR_PTE_NOT_FOUND | MFC_DSISR_ACCESS_DENIED))
  61                 return 1;
  62
  63         if (ctx->csa.class_0_pending)
  64                 return 1;
  65
  66         return 0;
  67 }
  68
  69 static int spu_setup_isolated(struct spu_context *ctx)
  70 {
  71         int ret;
  72         u64 __iomem *mfc_cntl;
  73         u64 sr1;
  74         u32 status;
  75         unsigned long timeout;
  76         const u32 status_loading = SPU_STATUS_RUNNING
  77                 | SPU_STATUS_ISOLATED_STATE | SPU_STATUS_ISOLATED_LOAD_STATUS;
  78
  79         ret = -ENODEV;
  80         if (!isolated_loader)
  81                 goto out;
  82
  83         /*
  84          * We need to exclude userspace access to the context.
  85          *
  86          * To protect against memory access we invalidate all ptes
  87          * and make sure the pagefault handlers block on the mutex.
  88          */
  89         spu_unmap_mappings(ctx);
  90
  91         mfc_cntl = &ctx->spu->priv2->mfc_control_RW;
  92
  93         /* purge the MFC DMA queue to ensure no spurious accesses before we
  94          * enter kernel mode */
  95         timeout = jiffies + HZ;
  96         out_be64(mfc_cntl, MFC_CNTL_PURGE_DMA_REQUEST);
  97         while ((in_be64(mfc_cntl) & MFC_CNTL_PURGE_DMA_STATUS_MASK)
  98                         != MFC_CNTL_PURGE_DMA_COMPLETE) {
  99                 if (time_after(jiffies, timeout)) {
 100                         printk(KERN_ERR "%s: timeout flushing MFC DMA queue\n",
 101                                         __FUNCTION__);
 102                         ret = -EIO;
 103                         goto out;
 104                 }
 105                 cond_resched();
 106         }
 107
 108         /* put the SPE in kernel mode to allow access to the loader */
 109         sr1 = spu_mfc_sr1_get(ctx->spu);
 110         sr1 &= ~MFC_STATE1_PROBLEM_STATE_MASK;
 111         spu_mfc_sr1_set(ctx->spu, sr1);
 112
 113         /* start the loader */
 114         ctx->ops->signal1_write(ctx, (unsigned long)isolated_loader >> 32);
 115         ctx->ops->signal2_write(ctx,
 116                         (unsigned long)isolated_loader & 0xffffffff);
 117
 118         ctx->ops->runcntl_write(ctx,
 119                         SPU_RUNCNTL_RUNNABLE | SPU_RUNCNTL_ISOLATE);
 120
 121         ret = 0;
 122         timeout = jiffies + HZ;
 123         while (((status = ctx->ops->status_read(ctx)) & status_loading) ==
 124                                 status_loading) {
 125                 if (time_after(jiffies, timeout)) {
 126                         printk(KERN_ERR "%s: timeout waiting for loader\n",
 127                                         __FUNCTION__);
 128                         ret = -EIO;
 129                         goto out_drop_priv;
 130                 }
 131                 cond_resched();
 132         }
 133
 134         if (!(status & SPU_STATUS_RUNNING)) {
 135                 /* If isolated LOAD has failed: run SPU, we will get a stop-and
 136                  * signal later. */
 137                 pr_debug("%s: isolated LOAD failed\n", __FUNCTION__);
 138                 ctx->ops->runcntl_write(ctx, SPU_RUNCNTL_RUNNABLE);
 139                 ret = -EACCES;
 140                 goto out_drop_priv;
 141         }
 142
 143         if (!(status & SPU_STATUS_ISOLATED_STATE)) {
 144                 /* This isn't allowed by the CBEA, but check anyway */
 145                 pr_debug("%s: SPU fell out of isolated mode?\n", __FUNCTION__);
 146                 ctx->ops->runcntl_write(ctx, SPU_RUNCNTL_STOP);
 147                 ret = -EINVAL;
 148                 goto out_drop_priv;
 149         }
 150
 151 out_drop_priv:
 152         /* Finished accessing the loader. Drop kernel mode */
 153         sr1 |= MFC_STATE1_PROBLEM_STATE_MASK;
 154         spu_mfc_sr1_set(ctx->spu, sr1);
 155
 156 out:
 157         return ret;
 158 }
 159
 160 static int spu_run_init(struct spu_context *ctx, u32 *npc)
 161 {
 162         unsigned long runcntl = SPU_RUNCNTL_RUNNABLE;
 163         int ret;
 164
 165         spuctx_switch_state(ctx, SPU_UTIL_SYSTEM);
 166
 167         /*
 168          * NOSCHED is synchronous scheduling with respect to the caller.
 169          * The caller waits for the context to be loaded.
 170          */
 171         if (ctx->flags & SPU_CREATE_NOSCHED) {
 172                 if (ctx->state == SPU_STATE_SAVED) {
 173                         ret = spu_activate(ctx, 0);
 174                         if (ret)
 175                                 return ret;
 176                 }
 177         }
 178
 179         /*
 180          * Apply special setup as required.
 181          */
 182         if (ctx->flags & SPU_CREATE_ISOLATE) {
 183                 if (!(ctx->ops->status_read(ctx) & SPU_STATUS_ISOLATED_STATE)) {
 184                         ret = spu_setup_isolated(ctx);
 185                         if (ret)
 186                                 return ret;
 187                 }
 188
 189                 /*
 190                  * If userspace has set the runcntrl register (eg, to
 191                  * issue an isolated exit), we need to re-set it here
 192                  */
 193                 runcntl = ctx->ops->runcntl_read(ctx) &
 194                         (SPU_RUNCNTL_RUNNABLE | SPU_RUNCNTL_ISOLATE);
 195                 if (runcntl == 0)
 196                         runcntl = SPU_RUNCNTL_RUNNABLE;
 197         }
 198
 199         if (ctx->flags & SPU_CREATE_NOSCHED) {
 200                 spuctx_switch_state(ctx, SPU_UTIL_USER);
 201                 ctx->ops->runcntl_write(ctx, runcntl);
 202         } else {
 203                 unsigned long privcntl;
 204
 205                 if (test_thread_flag(TIF_SINGLESTEP))
 206                         privcntl = SPU_PRIVCNTL_MODE_SINGLE_STEP;
 207                 else
 208                         privcntl = SPU_PRIVCNTL_MODE_NORMAL;
 209
 210                 ctx->ops->npc_write(ctx, *npc);
 211                 ctx->ops->privcntl_write(ctx, privcntl);
 212                 ctx->ops->runcntl_write(ctx, runcntl);
 213
 214                 if (ctx->state == SPU_STATE_SAVED) {
 215                         ret = spu_activate(ctx, 0);
 216                         if (ret)
 217                                 return ret;
 218                 } else {
 219                         spuctx_switch_state(ctx, SPU_UTIL_USER);
 220                 }
 221         }
 222
 223         set_bit(SPU_SCHED_SPU_RUN, &ctx->sched_flags);
 224         return 0;
 225 }
 226
 227 static int spu_run_fini(struct spu_context *ctx, u32 *npc,
 228                                u32 *status)
 229 {
 230         int ret = 0;
 231
 232         spu_del_from_rq(ctx);
 233
 234         *status = ctx->ops->status_read(ctx);
 235         *npc = ctx->ops->npc_read(ctx);
 236
 237         spuctx_switch_state(ctx, SPU_UTIL_IDLE_LOADED);
 238         clear_bit(SPU_SCHED_SPU_RUN, &ctx->sched_flags);
 239         spu_release(ctx);
 240
 241         if (signal_pending(current))
 242                 ret = -ERESTARTSYS;
 243
 244         return ret;
 245 }
 246
 247 /*
 248  * SPU syscall restarting is tricky because we violate the basic
 249  * assumption that the signal handler is running on the interrupted
 250  * thread. Here instead, the handler runs on PowerPC user space code,
 251  * while the syscall was called from the SPU.
 252  * This means we can only do a very rough approximation of POSIX
 253  * signal semantics.
 254  */
 255 static int spu_handle_restartsys(struct spu_context *ctx, long *spu_ret,
 256                           unsigned int *npc)
 257 {
 258         int ret;
 259
 260         switch (*spu_ret) {
 261         case -ERESTARTSYS:
 262         case -ERESTARTNOINTR:
 263                 /*
 264                  * Enter the regular syscall restarting for
 265                  * sys_spu_run, then restart the SPU syscall
 266                  * callback.
 267                  */
 268                 *npc -= 8;
 269                 ret = -ERESTARTSYS;
 270                 break;
 271         case -ERESTARTNOHAND:
 272         case -ERESTART_RESTARTBLOCK:
 273                 /*
 274                  * Restart block is too hard for now, just return -EINTR
 275                  * to the SPU.
 276                  * ERESTARTNOHAND comes from sys_pause, we also return
 277                  * -EINTR from there.
 278                  * Assume that we need to be restarted ourselves though.
 279                  */
 280                 *spu_ret = -EINTR;
 281                 ret = -ERESTARTSYS;
 282                 break;
 283         default:
 284                 printk(KERN_WARNING "%s: unexpected return code %ld\n",
 285                         __FUNCTION__, *spu_ret);
 286                 ret = 0;
 287         }
 288         return ret;
 289 }
 290
 291 static int spu_process_callback(struct spu_context *ctx)
 292 {
 293         struct spu_syscall_block s;
 294         u32 ls_pointer, npc;
 295         void __iomem *ls;
 296         long spu_ret;
 297         int ret, ret2;
 298
 299         /* get syscall block from local store */
 300         npc = ctx->ops->npc_read(ctx) & ~3;
 301         ls = (void __iomem *)ctx->ops->get_ls(ctx);
 302         ls_pointer = in_be32(ls + npc);
 303         if (ls_pointer > (LS_SIZE - sizeof(s)))
 304                 return -EFAULT;
 305         memcpy_fromio(&s, ls + ls_pointer, sizeof(s));
 306
 307         /* do actual syscall without pinning the spu */
 308         ret = 0;
 309         spu_ret = -ENOSYS;
 310         npc += 4;
 311
 312         if (s.nr_ret < __NR_syscalls) {
 313                 spu_release(ctx);
 314                 /* do actual system call from here */
 315                 spu_ret = spu_sys_callback(&s);
 316                 if (spu_ret <= -ERESTARTSYS) {
 317                         ret = spu_handle_restartsys(ctx, &spu_ret, &npc);
 318                 }
 319                 ret2 = spu_acquire(ctx);
 320                 if (ret == -ERESTARTSYS)
 321                         return ret;
 322                 if (ret2)
 323                         return -EINTR;
 324         }
 325
 326         /* write result, jump over indirect pointer */
 327         memcpy_toio(ls + ls_pointer, &spu_ret, sizeof(spu_ret));
 328         ctx->ops->npc_write(ctx, npc);
 329         ctx->ops->runcntl_write(ctx, SPU_RUNCNTL_RUNNABLE);
 330         return ret;
 331 }
 332
 333 long spufs_run_spu(struct spu_context *ctx, u32 *npc, u32 *event)
 334 {
 335         int ret;
 336         struct spu *spu;
 337         u32 status;
 338
 339         if (mutex_lock_interruptible(&ctx->run_mutex))
 340                 return -ERESTARTSYS;
 341
 342         spu_enable_spu(ctx);
 343         ctx->event_return = 0;
 344
 345         ret = spu_acquire(ctx);
 346         if (ret)
 347                 goto out_unlock;
 348
 349         spu_update_sched_info(ctx);
 350
 351         ret = spu_run_init(ctx, npc);
 352         if (ret) {
 353                 spu_release(ctx);
 354                 goto out;
 355         }
 356
 357         do {
 358                 ret = spufs_wait(ctx->stop_wq, spu_stopped(ctx, &status));
 359                 if (unlikely(ret)) {
 360                         /*
 361                          * This is nasty: we need the state_mutex for all the
 362                          * bookkeeping even if the syscall was interrupted by
 363                          * a signal. ewww.
 364                          */
 365                         mutex_lock(&ctx->state_mutex);
 366                         break;
 367                 }
 368                 spu = ctx->spu;
 369                 if (unlikely(test_and_clear_bit(SPU_SCHED_NOTIFY_ACTIVE,
 370                                                 &ctx->sched_flags))) {
 371                         if (!(status & SPU_STATUS_STOPPED_BY_STOP)) {
 372                                 spu_switch_notify(spu, ctx);
 373                                 continue;
 374                         }
 375                 }
 376
 377                 spuctx_switch_state(ctx, SPU_UTIL_SYSTEM);
 378
 379                 if ((status & SPU_STATUS_STOPPED_BY_STOP) &&
 380                     (status >> SPU_STOP_STATUS_SHIFT == 0x2104)) {
 381                         ret = spu_process_callback(ctx);
 382                         if (ret)
 383                                 break;
 384                         status &= ~SPU_STATUS_STOPPED_BY_STOP;
 385                 }
 386                 ret = spufs_handle_class1(ctx);
 387                 if (ret)
 388                         break;
 389
 390                 ret = spufs_handle_class0(ctx);
 391                 if (ret)
 392                         break;
 393
 394                 if (signal_pending(current))
 395                         ret = -ERESTARTSYS;
 396         } while (!ret && !(status & (SPU_STATUS_STOPPED_BY_STOP |
 397                                       SPU_STATUS_STOPPED_BY_HALT |
 398                                        SPU_STATUS_SINGLE_STEP)));
 399
 400         spu_disable_spu(ctx);
 401         ret = spu_run_fini(ctx, npc, &status);
 402         spu_yield(ctx);
 403
 404         if ((status & SPU_STATUS_STOPPED_BY_STOP) &&
 405             (((status >> SPU_STOP_STATUS_SHIFT) & 0x3f00) == 0x2100))
 406                 ctx->stats.libassist++;
 407
 408         if ((ret == 0) ||
 409             ((ret == -ERESTARTSYS) &&
 410              ((status & SPU_STATUS_STOPPED_BY_HALT) ||
 411               (status & SPU_STATUS_SINGLE_STEP) ||
 412               ((status & SPU_STATUS_STOPPED_BY_STOP) &&
 413                (status >> SPU_STOP_STATUS_SHIFT != 0x2104)))))
 414                 ret = status;
 415
 416         /* Note: we don't need to force_sig SIGTRAP on single-step
 417          * since we have TIF_SINGLESTEP set, thus the kernel will do
 418          * it upon return from the syscall anyawy
 419          */
 420         if (unlikely(status & SPU_STATUS_SINGLE_STEP))
 421                 ret = -ERESTARTSYS;
 422
 423         else if (unlikely((status & SPU_STATUS_STOPPED_BY_STOP)
 424             && (status >> SPU_STOP_STATUS_SHIFT) == 0x3fff)) {
 425                 force_sig(SIGTRAP, current);
 426                 ret = -ERESTARTSYS;
 427         }
 428
 429 out:
 430         *event = ctx->event_return;
 431 out_unlock:
 432         mutex_unlock(&ctx->run_mutex);
 433         return ret;
 434 }