MALI: rockchip: upgrade midgard DDK to r13p0-00rel0

[firefly-linux-kernel-4.4.55.git] / drivers / gpu / arm / midgard / mali_kbase_defs.h
diff --git a/drivers/gpu/arm/midgard/mali_kbase_defs.h b/drivers/gpu/arm/midgard/mali_kbase_defs.h

index d0eae8e3486bb65adb9f2a57d34908c9979dcdaf..4bb8c2c7aec23176a4208809a58a087fe4936025 100644 (file)
--- a/drivers/gpu/arm/midgard/mali_kbase_defs.h
+++ b/drivers/gpu/arm/midgard/mali_kbase_defs.h
@@ -33,7 +33,7 @@
  #include <mali_kbase_mem_lowlevel.h>
  #include <mali_kbase_mmu_hw.h>
  #include <mali_kbase_mmu_mode.h>
-#include <mali_kbase_instr.h>
+#include <mali_kbase_instr_defs.h>
  
  #include <linux/atomic.h>
  #include <linux/mempool.h>
@@ -177,20 +177,18 @@
  #define KBASE_KATOM_FLAG_BEEN_HARD_STOPPED (1<<4)
  /** Atom has caused us to enter disjoint state */
  #define KBASE_KATOM_FLAG_IN_DISJOINT (1<<5)
-/* Atom has fail dependency on same-slot dependency */
-#define KBASE_KATOM_FLAG_FAIL_PREV (1<<6)
  /* Atom blocked on cross-slot dependency */
  #define KBASE_KATOM_FLAG_X_DEP_BLOCKED (1<<7)
  /* Atom has fail dependency on cross-slot dependency */
  #define KBASE_KATOM_FLAG_FAIL_BLOCKER (1<<8)
-/* Atom has been submitted to JSCTX ringbuffers */
-#define KBASE_KATOM_FLAG_JSCTX_RB_SUBMITTED (1<<9)
+/* Atom is currently in the list of atoms blocked on cross-slot dependencies */
+#define KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST (1<<9)
  /* Atom is currently holding a context reference */
  #define KBASE_KATOM_FLAG_HOLDING_CTX_REF (1<<10)
-/* Atom requires GPU to be in secure mode */
-#define KBASE_KATOM_FLAG_SECURE (1<<11)
-/* Atom has been stored in linked list */
-#define KBASE_KATOM_FLAG_JSCTX_IN_LL (1<<12)
+/* Atom requires GPU to be in protected mode */
+#define KBASE_KATOM_FLAG_PROTECTED (1<<11)
+/* Atom has been stored in runnable_tree */
+#define KBASE_KATOM_FLAG_JSCTX_IN_TREE (1<<12)
  
  /* SW related flags about types of JS_COMMAND action
   * NOTE: These must be masked off by JS_COMMAND_MASK */
@@ -237,11 +235,11 @@ struct kbase_jd_atom_dependency {
   *
   * @return readonly reference to dependent ATOM.
   */
-static inline const struct kbase_jd_atom *const kbase_jd_katom_dep_atom(const struct kbase_jd_atom_dependency *dep)
+static inline const struct kbase_jd_atom * kbase_jd_katom_dep_atom(const struct kbase_jd_atom_dependency *dep)
  {
         LOCAL_ASSERT(dep != NULL);
  
-       return (const struct kbase_jd_atom * const)(dep->atom);
+       return (const struct kbase_jd_atom *)(dep->atom);
  }
  
  /**
@@ -252,7 +250,7 @@ static inline const struct kbase_jd_atom *const kbase_jd_katom_dep_atom(const st
   *
   * @return A dependency type value.
   */
-static inline const u8 kbase_jd_katom_dep_type(const struct kbase_jd_atom_dependency *dep)
+static inline u8 kbase_jd_katom_dep_type(const struct kbase_jd_atom_dependency *dep)
  {
         LOCAL_ASSERT(dep != NULL);
  
@@ -303,13 +301,15 @@ enum kbase_atom_gpu_rb_state {
         KBASE_ATOM_GPU_RB_NOT_IN_SLOT_RB,
         /* Atom is in slot ringbuffer but is blocked on a previous atom */
         KBASE_ATOM_GPU_RB_WAITING_BLOCKED,
+       /* Atom is in slot ringbuffer but is waiting for proected mode exit */
+       KBASE_ATOM_GPU_RB_WAITING_PROTECTED_MODE_EXIT,
         /* Atom is in slot ringbuffer but is waiting for cores to become
          * available */
         KBASE_ATOM_GPU_RB_WAITING_FOR_CORE_AVAILABLE,
         /* Atom is in slot ringbuffer but is blocked on affinity */
         KBASE_ATOM_GPU_RB_WAITING_AFFINITY,
-       /* Atom is in slot ringbuffer but is waiting for secure mode switch */
-       KBASE_ATOM_GPU_RB_WAITING_SECURE_MODE,
+       /* Atom is in slot ringbuffer but is waiting for protected mode entry */
+       KBASE_ATOM_GPU_RB_WAITING_PROTECTED_MODE_ENTRY,
         /* Atom is in slot ringbuffer and ready to run */
         KBASE_ATOM_GPU_RB_READY,
         /* Atom is in slot ringbuffer and has been submitted to the GPU */
@@ -319,6 +319,23 @@ enum kbase_atom_gpu_rb_state {
         KBASE_ATOM_GPU_RB_RETURN_TO_JS
  };
  
+enum kbase_atom_exit_protected_state {
+       /*
+        * Starting state:
+        * Check if a transition out of protected mode is required.
+        */
+       KBASE_ATOM_EXIT_PROTECTED_CHECK,
+       /* Wait for the L2 to become idle in preparation for the reset. */
+       KBASE_ATOM_EXIT_PROTECTED_IDLE_L2,
+       /* Issue the protected reset. */
+       KBASE_ATOM_EXIT_PROTECTED_RESET,
+       /*
+        * End state;
+        * Wait for the reset to complete.
+        */
+       KBASE_ATOM_EXIT_PROTECTED_RESET_WAIT,
+};
+
  struct kbase_ext_res {
         u64 gpu_address;
         struct kbase_mem_phy_alloc *alloc;
@@ -335,6 +352,13 @@ struct kbase_jd_atom {
         struct list_head dep_head[2];
         struct list_head dep_item[2];
         const struct kbase_jd_atom_dependency dep[2];
+       /* List head used during job dispatch job_done processing - as
+        * dependencies may not be entirely resolved at this point, we need to
+        * use a separate list head. */
+       struct list_head jd_item;
+       /* true if atom's jd_item is currently on a list. Prevents atom being
+        * processed twice. */
+       bool in_jd_list;
  
         u16 nr_extres;
         struct kbase_ext_res *extres;
@@ -440,6 +464,11 @@ struct kbase_jd_atom {
  
         atomic_t blocked;
  
+       /* Pointer to atom that this atom has same-slot dependency on */
+       struct kbase_jd_atom *pre_dep;
+       /* Pointer to atom that has same-slot dependency on this atom */
+       struct kbase_jd_atom *post_dep;
+
         /* Pointer to atom that this atom has cross-slot dependency on */
         struct kbase_jd_atom *x_pre_dep;
         /* Pointer to atom that has cross-slot dependency on this atom */
@@ -454,6 +483,12 @@ struct kbase_jd_atom {
         struct base_job_fault_event fault_event;
  #endif
  
+       /* List head used for two different purposes:
+        *  1. Overflow list for JS ring buffers. If an atom is ready to run,
+        *     but there is no room in the JS ring buffer, then the atom is put
+        *     on the ring buffer's overflow list using this list node.
+        *  2. List of waiting soft jobs.
+        */
         struct list_head queue;
  
         struct kbase_va_region *jit_addr_reg;
@@ -461,11 +496,18 @@ struct kbase_jd_atom {
         /* If non-zero, this indicates that the atom will fail with the set
          * event_code when the atom is processed. */
         enum base_jd_event_code will_fail_event_code;
+
+       enum kbase_atom_exit_protected_state exit_protected_state;
+
+       struct rb_node runnable_tree_node;
+
+       /* 'Age' of atom relative to other atoms in the context. */
+       u32 age;
  };
  
-static inline bool kbase_jd_katom_is_secure(const struct kbase_jd_atom *katom)
+static inline bool kbase_jd_katom_is_protected(const struct kbase_jd_atom *katom)
  {
-       return (bool)(katom->atom_flags & KBASE_KATOM_FLAG_SECURE);
+       return (bool)(katom->atom_flags & KBASE_KATOM_FLAG_PROTECTED);
  }
  
  /*
@@ -787,27 +829,36 @@ struct kbase_pm_device_data {
  };
  
  /**
- * struct kbase_secure_ops - Platform specific functions for GPU secure mode
- * operations
- * @secure_mode_enable:  Callback to enable secure mode on the GPU
- * @secure_mode_disable: Callback to disable secure mode on the GPU
+ * struct kbase_protected_ops - Platform specific functions for GPU protected
+ * mode operations
+ * @protected_mode_enter: Callback to enter protected mode on the GPU
+ * @protected_mode_reset: Callback to reset the GPU and exit protected mode.
+ * @protected_mode_supported: Callback to check if protected mode is supported.
   */
-struct kbase_secure_ops {
+struct kbase_protected_ops {
         /**
-        * secure_mode_enable() - Enable secure mode on the GPU
+        * protected_mode_enter() - Enter protected mode on the GPU
          * @kbdev:      The kbase device
          *
          * Return: 0 on success, non-zero on error
          */
-       int (*secure_mode_enable)(struct kbase_device *kbdev);
+       int (*protected_mode_enter)(struct kbase_device *kbdev);
  
         /**
-        * secure_mode_disable() - Disable secure mode on the GPU
+        * protected_mode_reset() - Reset the GPU and exit protected mode
          * @kbdev:      The kbase device
          *
          * Return: 0 on success, non-zero on error
          */
-       int (*secure_mode_disable)(struct kbase_device *kbdev);
+       int (*protected_mode_reset)(struct kbase_device *kbdev);
+
+       /**
+        * protected_mode_supported() - Check if protected mode is supported
+        * @kbdev:      The kbase device
+        *
+        * Return: 0 on success, non-zero on error
+        */
+       bool (*protected_mode_supported)(struct kbase_device *kbdev);
  };
  
  
@@ -953,9 +1004,6 @@ struct kbase_device {
                 struct kbase_context *kctx;
                 u64 addr;
  
-               struct kbase_context *suspended_kctx;
-               struct kbase_uk_hwcnt_setup suspended_state;
-
                 struct kbase_instr_backend backend;
         } hwcnt;
  
@@ -971,30 +1019,6 @@ struct kbase_device {
         struct kbase_trace            *trace_rbuf;
  #endif
  
-       /* This is used to override the current job scheduler values for
-        * JS_SCHEDULING_PERIOD_NS
-        * JS_SOFT_STOP_TICKS
-        * JS_SOFT_STOP_TICKS_CL
-        * JS_HARD_STOP_TICKS_SS
-        * JS_HARD_STOP_TICKS_CL
-        * JS_HARD_STOP_TICKS_DUMPING
-        * JS_RESET_TICKS_SS
-        * JS_RESET_TICKS_CL
-        * JS_RESET_TICKS_DUMPING.
-        *
-        * These values are set via the js_timeouts sysfs file.
-        */
-       u32 js_scheduling_period_ns;
-       int js_soft_stop_ticks;
-       int js_soft_stop_ticks_cl;
-       int js_hard_stop_ticks_ss;
-       int js_hard_stop_ticks_cl;
-       int js_hard_stop_ticks_dumping;
-       int js_reset_ticks_ss;
-       int js_reset_ticks_cl;
-       int js_reset_ticks_dumping;
-       bool js_timeouts_updated;
-
         u32 reset_timeout_ms;
  
         struct mutex cacheclean_lock;
@@ -1012,8 +1036,12 @@ struct kbase_device {
         unsigned long current_freq;
         unsigned long current_voltage;
  #ifdef CONFIG_DEVFREQ_THERMAL
+#if LINUX_VERSION_CODE < KERNEL_VERSION(4, 4, 0)
+       struct devfreq_cooling_device *devfreq_cooling;
+#else
         struct thermal_cooling_device *devfreq_cooling;
  #endif
+#endif
  #endif
  
         struct kbase_ipa_context *ipa_ctx;
@@ -1034,6 +1062,11 @@ struct kbase_device {
         /* Root directory for per context entry */
         struct dentry *debugfs_ctx_directory;
  
+#ifdef CONFIG_MALI_DEBUG
+       /* bit for each as, set if there is new data to report */
+       u64 debugfs_as_read_bitmap;
+#endif /* CONFIG_MALI_DEBUG */
+
         /* failed job dump, used for separate debug process */
         wait_queue_head_t job_fault_wq;
         wait_queue_head_t job_fault_resume_wq;
@@ -1103,18 +1136,23 @@ struct kbase_device {
         u32 snoop_enable_smc;
         u32 snoop_disable_smc;
  
-       /* Secure operations */
-       struct kbase_secure_ops *secure_ops;
+       /* Protected operations */
+       struct kbase_protected_ops *protected_ops;
+
+       /*
+        * true when GPU is put into protected mode
+        */
+       bool protected_mode;
  
         /*
-        * true when GPU is put into secure mode
+        * true when GPU is transitioning into or out of protected mode
          */
-       bool secure_mode;
+       bool protected_mode_transition;
  
         /*
-        * true if secure mode is supported
+        * true if protected mode is supported
          */
-       bool secure_mode_support;
+       bool protected_mode_support;
  
  
  #ifdef CONFIG_MALI_DEBUG
@@ -1135,79 +1173,22 @@ struct kbase_device {
         u32 inited_subsys;
  };
  
-/* JSCTX ringbuffer size will always be a power of 2. The idx shift must be:
-   - >=2 (buffer size -> 4)
-   - <= 9 (buffer size 2^(9-1)=256) (technically, 10 works for the ringbuffer
-                               but this is unnecessary as max atoms is 256)
- */
-#define JSCTX_RB_IDX_SHIFT (8U)
-#if ((JSCTX_RB_IDX_SHIFT < 2) || ((3 * JSCTX_RB_IDX_SHIFT) >= 32))
-#error "Invalid ring buffer size for 32bit atomic."
-#endif
-#define JSCTX_RB_SIZE (1U << (JSCTX_RB_IDX_SHIFT - 1U)) /* 1 bit for overflow */
-#define JSCTX_RB_SIZE_STORE (1U << JSCTX_RB_IDX_SHIFT)
-#define JSCTX_RB_MASK (JSCTX_RB_SIZE - 1U)
-#define JSCTX_RB_MASK_STORE (JSCTX_RB_SIZE_STORE - 1U)
-
-#define JSCTX_WR_OFFSET         (0U)
-#define JSCTX_RN_OFFSET         (JSCTX_WR_OFFSET   + JSCTX_RB_IDX_SHIFT)
-#define JSCTX_RD_OFFSET         (JSCTX_RN_OFFSET + JSCTX_RB_IDX_SHIFT)
-
  /**
- * struct jsctx_rb_entry - Ringbuffer entry in &struct jsctx_queue.
- * @atom_id: Atom ID
- */
-struct jsctx_rb_entry {
-       u16 atom_id;
-};
-
-/**
- * struct jsctx_queue - JS context atom queue, containing both ring buffer and linked list.
- * @entries:     Array of size %JSCTX_RB_SIZE which holds the &struct
- *               kbase_jd_atom pointers which make up the contents of the ring
- *               buffer.
- * @indicies:    An atomic variable containing indicies for the ring buffer.
- *               Indicies are of size JSCTX_RB_IDX_SHIFT.
- *               The following are contained:
- *                - WR_IDX - Write index. Index of the NEXT slot to be written.
- *                - RN_IDX - Running index. Index of the tail of the list.
- *                           This is the atom that has been running the longest.
- *                - RD_IDX - Read index. Index of the next atom to be pulled.
- * @queue_head:  Head item of the linked list queue.
- *
- * Locking:
- * The linked list assumes jctx.lock is held.
- * The ringbuffer serves as an intermediary between irq context and non-irq
- * context, without the need for the two to share any lock. irq context can
- * pull (and unpull) and only requires the runpool_irq.lock. While non-irq
- * context can add and remove and only requires holding only jctx.lock.
- * Error handling affecting both, or the whole ringbuffer in general, must
- * hold both locks or otherwise ensure (f.ex deschedule/kill) only that thread
- * is accessing the buffer.
- * This means that RD_IDX is updated by irq-context (pull and unpull) and must
- * hold runpool_irq.lock. While WR_IDX (add) and RN_IDX (remove) is updated by
- * non-irq context and must hold jctx.lock.
- * Note that pull (or sister function peek) must also access WR_IDX to ensure
- * there is free space in the buffer, this is ok as WR_IDX is only increased.
- * A similar situation is apparent with unpull and RN_IDX, but only one atom
- * (already pulled) can cause either remove or unpull, so this will never
- * conflict.
+ * struct jsctx_queue - JS context atom queue
+ * @runnable_tree: Root of RB-tree containing currently runnable atoms on this
+ *                 job slot.
+ * @x_dep_head:    Head item of the linked list of atoms blocked on cross-slot
+ *                 dependencies. Atoms on this list will be moved to the
+ *                 runnable_tree when the blocking atom completes.
   *
- * &struct jsctx_queue is a queue of &struct kbase_jd_atom,
- * part ringbuffer and part linked list.
+ * runpool_irq.lock must be held when accessing this structure.
   */
  struct jsctx_queue {
-       struct jsctx_rb_entry entries[JSCTX_RB_SIZE];
-
-       atomic_t indicies;
-
-       struct list_head queue_head;
+       struct rb_root runnable_tree;
+       struct list_head x_dep_head;
  };
  
  
-
-
-
  #define KBASE_API_VERSION(major, minor) ((((major) & 0xFFF) << 20)  | \
                                          (((minor) & 0xFFF) << 8) | \
                                          ((0 & 0xFF) << 0))
@@ -1334,9 +1315,6 @@ struct kbase_context {
         /* Bitmask of slots that can be pulled from */
         u32 slots_pullable;
  
-       /* true if address space assignment is pending */
-       bool as_pending;
-
         /* Backend specific data */
         struct kbase_context_backend backend;
  
@@ -1359,10 +1337,10 @@ struct kbase_context {
         bool ctx_runnable_ref;
  
         /* Waiting soft-jobs will fail when this timer expires */
-       struct hrtimer soft_event_timeout;
+       struct timer_list soft_job_timeout;
  
         /* JIT allocation management */
-       struct kbase_va_region *jit_alloc[255];
+       struct kbase_va_region *jit_alloc[256];
         struct list_head jit_active_head;
         struct list_head jit_pool_head;
         struct list_head jit_destroy_head;
@@ -1371,6 +1349,12 @@ struct kbase_context {
  
         /* External sticky resource management */
         struct list_head ext_res_meta_head;
+
+       /* Used to record that a drain was requested from atomic context */
+       atomic_t drain_pending;
+
+       /* Current age count, used to determine age for newly submitted atoms */
+       u32 age_count;
  };
  
  /**
@@ -1426,7 +1410,7 @@ static inline bool kbase_device_is_cpu_coherent(struct kbase_device *kbdev)
  }
  
  /* Conversion helpers for setting up high resolution timers */
-#define HR_TIMER_DELAY_MSEC(x) (ns_to_ktime((x)*1000000U))
+#define HR_TIMER_DELAY_MSEC(x) (ns_to_ktime(((u64)(x))*1000000U))
  #define HR_TIMER_DELAY_NSEC(x) (ns_to_ktime(x))
  
  /* Maximum number of loops polling the GPU for a cache flush before we assume it must have completed */